X-Git-Url: http://git.bitcoin.ninja/index.cgi?a=blobdiff_plain;f=youtube_dl%2Fextractor%2Ftagesschau.py;h=b870474515ba61ee33641c86554d53d68a6bf46d;hb=cc7fec5818254f4679896823c7de9d17f50201ca;hp=bd935063f3b6e327e6fe3e47b5a119af01cd07da;hpb=7ffad0af5ab392ed5ea7ec9165fd42d012a669f5;p=youtube-dl diff --git a/youtube_dl/extractor/tagesschau.py b/youtube_dl/extractor/tagesschau.py index bd935063f..b87047451 100644 --- a/youtube_dl/extractor/tagesschau.py +++ b/youtube_dl/extractor/tagesschau.py @@ -7,7 +7,7 @@ from .common import InfoExtractor class TagesschauIE(InfoExtractor): - _VALID_URL = r'https?://(?:www\.)?tagesschau\.de/multimedia/video/video(?P-?\d+)\.html' + _VALID_URL = r'https?://(?:www\.)?tagesschau\.de/multimedia/video/video(?P-?[0-9]+)\.html' _TESTS = [{ 'url': 'http://www.tagesschau.de/multimedia/video/video1399128.html', @@ -19,17 +19,13 @@ class TagesschauIE(InfoExtractor): 'description': 'md5:69da3c61275b426426d711bde96463ab', 'thumbnail': 're:^http:.*\.jpg$', }, - }, { - 'url': 'http://www.tagesschau.de/multimedia/video/video-196.html', - 'md5': '8aaa8bf3ae1ca2652309718c03019128', - 'info_dict': { - 'id': '196', - 'ext': 'mp4', - 'title': 'Ukraine-Konflikt: Klitschko in Kiew als B\xfcrgermeister vereidigt', - 'description': 'md5:f22e4af75821d174fa6c977349682691', - 'thumbnail': 're:http://.*\.jpg', - }, - }] + }] + + _FORMATS = { + 's': {'width': 256, 'height': 144, 'quality': 1}, + 'm': {'width': 512, 'height': 288, 'quality': 2}, + 'l': {'width': 960, 'height': 544, 'quality': 3}, + } def _real_extract(self, url): mobj = re.match(self._VALID_URL, url) @@ -43,29 +39,22 @@ class TagesschauIE(InfoExtractor): webpage = self._download_webpage(url, display_id) playerpage = self._download_webpage( - 'http://www.tagesschau.de/multimedia/video/video%s~player_autoplay-true.html' % video_id, display_id) + 'http://www.tagesschau.de/multimedia/video/video%s~player_autoplay-true.html' % video_id, + display_id, 'Downloading player page') - medias = re.findall(r'"(http://media.+?)", type:"video/(.+?)", quality:"(.+?)"', playerpage) + medias = re.findall( + r'"(http://media.+?)", type:"video/(.+?)", quality:"(.+?)"', + playerpage) formats = [] for url, ext, res in medias: - - if res == 's': - res = 'small' - quality = 0 - elif res == 'm': - res = 'medium' - quality = 1 - elif res == 'l': - res = 'large' - quality = 2 - - formats.append({ - 'format_id': res+'_'+ext, + f = { + 'format_id': res + '_' + ext, 'url': url, - 'quality': quality, 'ext': ext, - }) + } + f.update(self._FORMATS.get(res, {})) + formats.append(f) self._sort_formats(formats) @@ -74,7 +63,7 @@ class TagesschauIE(InfoExtractor): return { 'id': display_id, 'title': self._og_search_title(webpage).strip(), - 'thumbnail': 'http://www.tagesschau.de'+thumbnail, + 'thumbnail': 'http://www.tagesschau.de' + thumbnail, 'formats': formats, 'description': self._og_search_description(webpage).strip(), }