[kanalplay] Add extractor (Closes #5188)
[youtube-dl] / youtube_dl / extractor / kanalplay.py
1 # coding: utf-8
2 from __future__ import unicode_literals
3
4 import re
5
6 from .common import InfoExtractor
7 from ..utils import (
8     ExtractorError,
9     float_or_none,
10 )
11
12
class KanalPlayIE(InfoExtractor):
    """Information extractor for kanal5play.se, kanal9play.se and kanal11play.se.

    The channel number (5, 9 or 11) and the numeric video id are both taken
    from the page URL and used to query the site's ``getVideo`` JSON API.
    """
    IE_DESC = 'Kanal 5/9/11 Play'
    _VALID_URL = r'https?://(?:www\.)?kanal(?P<channel_id>5|9|11)play\.se/(?:#!/)?(?:play/)?program/\d+/video/(?P<id>\d+)'
    _TESTS = [{
        'url': 'http://www.kanal5play.se/#!/play/program/3060212363/video/3270012277',
        'info_dict': {
            # Must equal the video id captured from the URL above, since
            # that is exactly what _real_extract returns as 'id'.
            'id': '3270012277',
            'ext': 'flv',
            'title': 'Saknar både dusch och avlopp',
            # NOTE(review): the digest after the 'md5:' prefix is missing;
            # confirm the expected description hash.
            'description': 'md5:',
            'duration': 2636.36,
        },
        'params': {
            # The formats are RTMP streams (play_path / rtmp_real_time), so
            # the media itself is not downloaded and no file md5 is checked.
            'skip_download': True,
        },
    }, {
        'url': 'http://www.kanal9play.se/#!/play/program/335032/video/246042',
        'only_matching': True,
    }, {
        'url': 'http://www.kanal11play.se/#!/play/program/232835958/video/367135199',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Extract metadata and stream formats for a single video page.

        :param url: a page URL matching ``_VALID_URL``.
        :returns: an info dict with the keys ``id``, ``title``,
            ``description``, ``thumbnail``, ``duration`` and ``formats``.
        :raises ExtractorError: (expected) when the API response carries a
            non-empty ``reasonsForNoStreams`` list; the reasons are joined
            with newlines into the error message.
        """
        mobj = re.match(self._VALID_URL, url)
        video_id = mobj.group('id')
        channel_id = mobj.group('channel_id')

        # The API lives on the same per-channel host as the page itself.
        video = self._download_json(
            'http://www.kanal%splay.se/api/getVideo?format=FLASH&videoId=%s' % (channel_id, video_id),
            video_id)

        # The API reports why no streams are available; surface that to the
        # user as an expected error instead of failing later on missing keys.
        reasons_for_no_streams = video.get('reasonsForNoStreams')
        if reasons_for_no_streams:
            raise ExtractorError(
                '%s returned error: %s' % (self.IE_NAME, '\n'.join(reasons_for_no_streams)),
                expected=True)

        # 'title' is mandatory; the remaining metadata fields are optional.
        title = video['title']
        description = video.get('description')
        # presumably 'length' is in milliseconds and is scaled to seconds
        # here - confirm against float_or_none's second argument.
        duration = float_or_none(video.get('length'), 1000)
        thumbnail = video.get('posterUrl')

        stream_base_url = video['streamBaseUrl']

        # Every stream shares the same base URL and differs only in its
        # play path and bitrate.
        formats = [{
            'url': stream_base_url,
            'play_path': stream['source'],
            'ext': 'flv',
            'tbr': float_or_none(stream.get('bitrate'), 1000),
            'rtmp_real_time': True,
        } for stream in video['streams']]
        self._sort_formats(formats)

        return {
            'id': video_id,
            'title': title,
            'description': description,
            'thumbnail': thumbnail,
            'duration': duration,
            'formats': formats,
        }