2 from __future__ import unicode_literals
4 from .common import InfoExtractor
12 class DRTVIE(InfoExtractor):
13 _VALID_URL = r'https?://(?:www\.)?dr\.dk/(?:tv/se|nyheder)/(?:[^/]+/)*(?P<id>[\da-z-]+)(?:[/#?]|$)'
16 'url': 'https://www.dr.dk/tv/se/boern/ultra/panisk-paske/panisk-paske-5',
17 'md5': 'dc515a9ab50577fa14cc4e4b0265168f',
19 'id': 'panisk-paske-5',
21 'title': 'Panisk Påske (5)',
22 'description': 'md5:ca14173c5ab24cd26b0fcc074dff391c',
23 'timestamp': 1426984612,
24 'upload_date': '20150322',
27 'skip': 'Video is no longer available',
29 'url': 'https://www.dr.dk/nyheder/indland/live-christianias-rydning-af-pusher-street-er-i-gang',
30 'md5': '2ada5074f9e79afc0d324a8e9784d850',
32 'id': 'christiania-pusher-street-ryddes-drdkrjpo',
34 'title': 'LIVE Christianias rydning af Pusher Street er i gang',
35 'description': '- Det er det fedeste, der er sket i 20 år, fortæller christianit til DR Nyheder.',
36 'timestamp': 1472800279,
37 'upload_date': '20160902',
42 def _real_extract(self, url):
43 video_id = self._match_id(url)
45 webpage = self._download_webpage(url, video_id)
47 if '>Programmet er ikke længere tilgængeligt' in webpage:
49 'Video %s is not available' % video_id, expected=True)
51 video_id = self._search_regex(
52 (r'data-(?:material-identifier|episode-slug)="([^"]+)"',
53 r'data-resource="[^>"]+mu/programcard/expanded/([^"]+)"'),
56 programcard = self._download_json(
57 'http://www.dr.dk/mu/programcard/expanded/%s' % video_id,
58 video_id, 'Downloading video JSON')
59 data = programcard['Data'][0]
61 title = remove_end(self._og_search_title(webpage), ' | TV | DR') or data['Title']
62 description = self._og_search_description(webpage) or data['Description']
64 timestamp = parse_iso8601(data['CreatedTime'])
69 restricted_to_denmark = False
74 for asset in data['Assets']:
75 if asset['Kind'] == 'Image':
76 thumbnail = asset['Uri']
77 elif asset['Kind'] == 'VideoResource':
78 duration = asset['DurationInMilliseconds'] / 1000.0
79 restricted_to_denmark = asset['RestrictedToDenmark']
80 spoken_subtitles = asset['Target'] == 'SpokenSubtitles'
81 for link in asset['Links']:
83 target = link['Target']
88 format_id += '-spoken-subtitles'
90 formats.extend(self._extract_f4m_formats(
91 uri + '?hdcore=3.3.0&plugin=aasp-3.3.0.99.43',
92 video_id, preference, f4m_id=format_id))
94 formats.extend(self._extract_m3u8_formats(
95 uri, video_id, 'mp4', preference=preference,
98 bitrate = link.get('Bitrate')
100 format_id += '-%s' % bitrate
103 'format_id': format_id,
105 'ext': link.get('FileFormat'),
107 subtitles_list = asset.get('SubtitlesList')
108 if isinstance(subtitles_list, list):
112 for subs in subtitles_list:
113 lang = subs['Language']
114 subtitles[LANGS.get(lang, lang)] = [{'url': subs['Uri'], 'ext': 'vtt'}]
116 if not formats and restricted_to_denmark:
117 raise ExtractorError(
118 'Unfortunately, DR is not allowed to show this program outside Denmark.', expected=True)
120 self._sort_formats(formats)
125 'description': description,
126 'thumbnail': thumbnail,
127 'timestamp': timestamp,
128 'duration': duration,
130 'subtitles': subtitles,