[eitb] fix info extraction
[youtube-dl] / youtube_dl / extractor / eitb.py
1 # encoding: utf-8
2 from __future__ import unicode_literals
3
4 from .common import InfoExtractor
5 from ..compat import compat_urllib_request
6 from ..utils import (
7     int_or_none,
8     unified_strdate,
9 )
10
11
12 class EitbIE(InfoExtractor):
13     IE_NAME = 'eitb.tv'
14     _VALID_URL = r'https?://www\.eitb\.tv/(eu/bideoa|es/video)/[^/]+/\d+/(?P<id>\d+)'
15
16     _TEST = {
17         'url': 'http://www.eitb.tv/es/video/60-minutos-60-minutos-2013-2014/4104995148001/4090227752001/lasa-y-zabala-30-anos/',
18         'md5': 'edf4436247185adee3ea18ce64c47998',
19         'info_dict': {
20             'id': '4090227752001',
21             'ext': 'mp4',
22             'title': '60 minutos (Lasa y Zabala, 30 aƱos)',
23             'description': '',
24             'duration': 3996760,
25             'upload_date': '20131014',
26         },
27     }
28
29     def _real_extract(self, url):
30         video_id = self._match_id(url)
31         video_data = self._download_json('http://mam.eitb.eus/mam/REST/ServiceMultiweb/Video/MULTIWEBTV/%s/' % video_id, video_id)['web_media'][0]
32
33         formats = []
34         for rendition in video_data['RENDITIONS']:
35             formats.append({
36                 'url': rendition['PMD_URL'],
37                 'width': int_or_none(rendition.get('FRAME_WIDTH')),
38                 'height': int_or_none(rendition.get('FRAME_HEIGHT')),
39                 'tbr': int_or_none(rendition.get('ENCODING_RATE')),
40             })
41
42         # TODO: parse f4m manifest
43         request = compat_urllib_request.Request(
44             'http://mam.eitb.eus/mam/REST/ServiceMultiweb/DomainRestrictedSecurity/TokenAuth/',
45             headers={'Referer': url})
46         token_data = self._download_json(request, video_id, fatal=False)
47         if token_data:
48             m3u8_formats = self._extract_m3u8_formats('%s?hdnts=%s' % (video_data['HLS_SURL'], token_data['token']), video_id, m3u8_id='hls', fatal=False)
49             if m3u8_formats:
50                 formats.extend(m3u8_formats)
51
52         self._sort_formats(formats)
53
54         return {
55             'id': video_id,
56             'title': video_data['NAME_ES'],
57             'description': video_data.get('SHORT_DESC_ES'),
58             'thumbnail': video_data.get('STILL_URL'),
59             'duration': int_or_none(video_data.get('LENGTH')),
60             'upload_date': unified_strdate(video_data.get('BROADCST_DATE')),
61             'formats': formats,
62         }