[once] Add new format extractor
[youtube-dl] / youtube_dl / extractor / once.py
1 # coding: utf-8
2 from __future__ import unicode_literals
3
4 import re
5
6 from .common import InfoExtractor
7
8
9 class OnceIE(InfoExtractor):
10     _VALID_URL = r'https?://once\.unicornmedia\.com/now/[^/]+/[^/]+/(?P<domain_id>[^/]+)/(?P<application_id>[^/]+)/(?:[^/]+/)?(?P<media_item_id>[^/]+)/content\.(?:once|m3u8|mp4)'
11     ADAPTIVE_URL_TEMPLATE = 'http://once.unicornmedia.com/now/master/playlist/%s/%s/%s/content.m3u8'
12     PROGRESSIVE_URL_TEMPLATE = 'http://once.unicornmedia.com/now/media/progressive/%s/%s/%s/%s/content.mp4'
13
14     def _extract_once_formats(self, url):
15         domain_id, application_id, media_item_id = re.match(
16             OnceIE._VALID_URL, url).groups()
17         adaptive_formats = self._extract_m3u8_formats(
18             self.ADAPTIVE_URL_TEMPLATE % (
19                 domain_id, application_id, media_item_id),
20             media_item_id, 'mp4', m3u8_id='hls', fatal=False)
21         formats = []
22         formats.extend(adaptive_formats)
23         for adaptive_format in adaptive_formats:
24             rendition_id = self._search_regex(
25                 r'/now/media/playlist/[^/]+/[^/]+/([^/]+)',
26                 adaptive_format['url'], 'redition id', default=None)
27             if rendition_id:
28                 progressive_format = adaptive_format.copy()
29                 progressive_format.update({
30                     'url': self.PROGRESSIVE_URL_TEMPLATE % (
31                         domain_id, application_id, rendition_id, media_item_id),
32                     'format_id': adaptive_format['format_id'].replace(
33                         'hls', 'http'),
34                     'protocol': 'http',
35                 })
36                 formats.append(progressive_format)
37         return formats