2014-11-23 14:41:03 -05:00
# coding: utf-8
2014-10-24 09:09:43 -04:00
from __future__ import unicode_literals
from . common import InfoExtractor
2015-05-07 10:07:11 -04:00
from . . utils import (
2015-05-07 10:09:27 -04:00
int_or_none ,
fix_xml_ampersands ,
2015-05-07 10:07:11 -04:00
)
2014-10-24 09:09:43 -04:00
class BildIE ( InfoExtractor ) :
_VALID_URL = r ' https?://(?:www \ .)?bild \ .de/(?:[^/]+/)+(?P<display_id>[^/]+)-(?P<id> \ d+)(?:,auto=true)? \ .bild \ .html '
IE_DESC = ' Bild.de '
_TEST = {
' url ' : ' http://www.bild.de/video/clip/apple-ipad-air/das-koennen-die-neuen-ipads-38184146.bild.html ' ,
' md5 ' : ' dd495cbd99f2413502a1713a1156ac8a ' ,
' info_dict ' : {
' id ' : ' 38184146 ' ,
' ext ' : ' mp4 ' ,
' title ' : ' BILD hat sie getestet ' ,
2015-05-07 10:20:43 -04:00
' thumbnail ' : ' re:^https?://.* \ .jpg$ ' ,
2014-10-24 09:09:43 -04:00
' duration ' : 196 ,
' description ' : ' Mit dem iPad Air 2 und dem iPad Mini 3 hat Apple zwei neue Tablet-Modelle präsentiert. BILD-Reporter Sven Stein durfte die Geräte bereits testen. ' ,
}
}
def _real_extract ( self , url ) :
video_id = self . _match_id ( url )
xml_url = url . split ( " .bild.html " ) [ 0 ] + " ,view=xml.bild.xml "
2015-05-07 10:07:11 -04:00
doc = self . _download_xml ( xml_url , video_id , transform_source = fix_xml_ampersands )
2014-10-24 09:09:43 -04:00
duration = int_or_none ( doc . attrib . get ( ' duration ' ) , scale = 1000 )
return {
' id ' : video_id ,
' title ' : doc . attrib [ ' ueberschrift ' ] ,
' description ' : doc . attrib . get ( ' text ' ) ,
' url ' : doc . attrib [ ' src ' ] ,
' thumbnail ' : doc . attrib . get ( ' img ' ) ,
' duration ' : duration ,
}