2 from __future__ import unicode_literals
4 from .common import InfoExtractor
# NOTE(review): this listing still carries the original file's line numbers at
# the start of every line and skips some lines; the comments below describe
# only what is visible here.
# Extractor class for dr.dk pages, derived from InfoExtractor.
15 class DRTVIE(InfoExtractor):
# Accepts http(s)://[www.]dr.dk/ followed by "tv/se" or "nyheder", any number
# of intermediate path segments, and a final slug captured as the "id" group
# (digits, lowercase a-z and hyphens). The slug must be followed by "/", "#",
# "?" or the end of the URL.
16 _VALID_URL = r'https?://(?:www\.)?dr\.dk/(?:tv/se|nyheder)/(?:[^/]+/)*(?P<id>[\da-z-]+)(?:[/#?]|$)'
# Sample expectations for a /tv/se/ URL. Presumably an entry of the
# extractor's test list -- the enclosing list/dict lines are not shown here.
19 'url': 'https://www.dr.dk/tv/se/boern/ultra/panisk-paske/panisk-paske-5',
20 'md5': 'dc515a9ab50577fa14cc4e4b0265168f',
22 'id': 'panisk-paske-5',
24 'title': 'Panisk Påske (5)',
25 'description': 'md5:ca14173c5ab24cd26b0fcc074dff391c',
26 'timestamp': 1426984612,
27 'upload_date': '20150322',
# This sample carries a 'skip' reason string.
30 'skip': 'Video is no longer available',
# Sample expectations for a /nyheder/ URL. The expected 'id' below is not the
# slug at the end of the URL.
32 'url': 'https://www.dr.dk/nyheder/indland/live-christianias-rydning-af-pusher-street-er-i-gang',
33 'md5': '2ada5074f9e79afc0d324a8e9784d850',
35 'id': 'christiania-pusher-street-ryddes-drdkrjpo',
37 'title': 'LIVE Christianias rydning af Pusher Street er i gang',
38 'description': '- Det er det fedeste, der er sket i 20 år, fortæller christianit til DR Nyheder.',
39 'timestamp': 1472800279,
40 'upload_date': '20160902',
# Download the page at `url`, look up the matching programcard JSON and gather
# title, description, timestamp, thumbnail, duration, formats and subtitles.
# NOTE(review): several lines of this method are not visible in this listing
# (branch conditions, initialisers, the opening of the result dict); comments
# that depend on them are marked as assumptions.
45 def _real_extract(self, url):
# Initial id comes from the URL.
46 video_id = self._match_id(url)
48 webpage = self._download_webpage(url, video_id)
# The marker text is Danish for "The programme is no longer available".
50 if '>Programmet er ikke længere tilgængeligt' in webpage:
# Arguments of a call whose opening line is not shown -- presumably an
# expected extraction error being raised; TODO confirm.
52 'Video %s is not available' % video_id, expected=True)
# video_id is replaced by a value found with one of two patterns: a
# data-material-identifier / data-episode-slug attribute, or the tail of a
# data-resource URL containing mu/programcard/expanded/. The text being
# searched and any further arguments are on lines not shown.
54 video_id = self._search_regex(
55 (r'data-(?:material-identifier|episode-slug)="([^"]+)"',
56 r'data-resource="[^>"]+mu/programcard/expanded/([^"]+)"'),
# Fetch the programcard JSON for the resolved id.
# NOTE(review): this request uses plain http -- confirm whether https should
# be used instead.
59 programcard = self._download_json(
60 'http://www.dr.dk/mu/programcard/expanded/%s' % video_id,
61 video_id, 'Downloading video JSON')
# Only the first element of 'Data' is used.
62 data = programcard['Data'][0]
# Title: the page's og:title passed through remove_end with ' | TV | DR'
# (presumably stripping that suffix); falls back to data['Title'] when that
# yields nothing.
64 title = remove_end(self._og_search_title(
65 webpage, default=None), ' | TV | DR') or data['Title']
# Description: the page's og:description, else the JSON 'Description' field.
66 description = self._og_search_description(
67 webpage, default=None) or data.get('Description')
69 timestamp = parse_iso8601(data.get('CreatedTime'))
# Starts as False; overwritten by every 'VideoResource' asset below, so the
# value seen after the loop is that of the last such asset.
74 restricted_to_denmark = False
79 for asset in data['Assets']:
# 'Image' assets supply the thumbnail URL.
80 if asset.get('Kind') == 'Image':
81 thumbnail = asset.get('Uri')
# 'VideoResource' assets supply duration, geo flag, links and subtitles.
82 elif asset.get('Kind') == 'VideoResource':
# Second argument 1000: presumably converts milliseconds to seconds.
83 duration = float_or_none(asset.get('DurationInMilliseconds'), 1000)
84 restricted_to_denmark = asset.get('RestrictedToDenmark')
85 spoken_subtitles = asset.get('Target') == 'SpokenSubtitles'
86 for link in asset.get('Links', []):
# format_id starts as the link's 'Target' (or an empty string).
90 target = link.get('Target')
91 format_id = target or ''
# Suffix added under a condition that is not shown -- presumably when
# spoken_subtitles is true.
95 format_id += '-spoken-subtitles'
# f4m manifest formats; the branch condition selecting this path is not shown.
97 formats.extend(self._extract_f4m_formats(
98 uri + '?hdcore=3.3.0&plugin=aasp-3.3.0.99.43',
99 video_id, preference, f4m_id=format_id))
# HLS links are expanded into m3u8 formats.
100 elif target == 'HLS':
101 formats.extend(self._extract_m3u8_formats(
102 uri, video_id, 'mp4', entry_protocol='m3u8_native',
103 preference=preference, m3u8_id=format_id))
# Presumably the fallback branch for other targets: the bitrate is appended to
# format_id and a single format entry is built from the link's fields.
105 bitrate = link.get('Bitrate')
107 format_id += '-%s' % bitrate
110 'format_id': format_id,
111 'tbr': int_or_none(bitrate),
112 'ext': link.get('FileFormat'),
# Subtitles are read only when 'SubtitlesList' is a list.
114 subtitles_list = asset.get('SubtitlesList')
115 if isinstance(subtitles_list, list):
119 for subs in subtitles_list:
# Entries without a 'Uri' are checked for here; the statement that follows is
# not shown (presumably they are skipped).
120 if not subs.get('Uri'):
# Language defaults to 'da'; it is looked up in LANGS (defined on a line not
# shown) and used unchanged when LANGS has no entry for it.
122 lang = subs.get('Language') or 'da'
123 subtitles.setdefault(LANGS.get(lang, lang), []).append({
# Extension derived from the MIME type, defaulting to 'vtt'.
125 'ext': mimetype2ext(subs.get('MimeType')) or 'vtt'
# No formats collected and the geo flag set: report a geo restriction.
128 if not formats and restricted_to_denmark:
129 self.raise_geo_restricted(
130 'Unfortunately, DR is not allowed to show this program outside Denmark.',
133 self._sort_formats(formats)
# Fields of the result; the surrounding dict/return lines are not shown.
138 'description': description,
139 'thumbnail': thumbnail,
140 'timestamp': timestamp,
141 'duration': duration,
143 'subtitles': subtitles,