[youtube] Fix extraction.
[youtube-dl] / youtube_dl / extractor / sportdeutschland.py
index 9d54043e5ba7ad50d27d088b133fdc376dddfa4c..378fc75686313f92a846aaa30579049e9a29eccc 100644 (file)
@@ -5,62 +5,67 @@ import re
 
 from .common import InfoExtractor
 from ..utils import (
-    compat_urllib_request,
     parse_iso8601,
+    sanitized_Request,
 )
 
 
 class SportDeutschlandIE(InfoExtractor):
     _VALID_URL = r'https?://sportdeutschland\.tv/(?P<sport>[^/?#]+)/(?P<id>[^?#/]+)(?:$|[?#])'
-    _TEST = {
-        'url': 'http://sportdeutschland.tv/badminton/live-li-ning-badminton-weltmeisterschaft-2014-kopenhagen',
+    _TESTS = [{
+        'url': 'https://sportdeutschland.tv/badminton/re-live-deutsche-meisterschaften-2020-halbfinals?playlistId=0',
         'info_dict': {
-            'id': 'live-li-ning-badminton-weltmeisterschaft-2014-kopenhagen',
+            'id': 're-live-deutsche-meisterschaften-2020-halbfinals',
             'ext': 'mp4',
-            'title': 'LIVE: Li-Ning Badminton Weltmeisterschaft 2014 Kopenhagen',
-            'categories': ['Badminton'],
+            'title': 're:Re-live: Deutsche Meisterschaften 2020.*Halbfinals',
+            'categories': ['Badminton-Deutschland'],
             'view_count': int,
-            'thumbnail': 're:^https?://.*\.jpg',
-            'description': 're:^Die Badminton-WM 2014 aus Kopenhagen LIVE',
-            'timestamp': 1409043600,
-            'upload_date': '20140826',
+            'thumbnail': r're:^https?://.*\.(?:jpg|png)$',
+            'timestamp': int,
+            'upload_date': '20200201',
+            'description': 're:.*',  # meaningless description for THIS video
         },
-        'params': {
-            'skip_download': 'Live stream',
-        },
-    }
+    }]
 
     def _real_extract(self, url):
         mobj = re.match(self._VALID_URL, url)
         video_id = mobj.group('id')
         sport_id = mobj.group('sport')
 
-        api_url = 'http://splink.tv/api/permalinks/%s/%s' % (
+        api_url = 'https://proxy.vidibusdynamic.net/ssl/backend.sportdeutschland.tv/api/permalinks/%s/%s?access_token=true' % (
             sport_id, video_id)
-        req = compat_urllib_request.Request(api_url, headers={
+        req = sanitized_Request(api_url, headers={
             'Accept': 'application/vnd.vidibus.v2.html+json',
             'Referer': url,
         })
         data = self._download_json(req, video_id)
 
-        categories = list(data.get('section', {}).get('tags', {}).values())
         asset = data['asset']
+        categories = [data['section']['title']]
 
+        formats = []
         smil_url = asset['video']
-        m3u8_url = smil_url.replace('.smil', '.m3u8')
-        formats = self._extract_m3u8_formats(m3u8_url, video_id, ext='mp4')
+        if '.smil' in smil_url:
+            m3u8_url = smil_url.replace('.smil', '.m3u8')
+            formats.extend(
+                self._extract_m3u8_formats(m3u8_url, video_id, ext='mp4'))
+
+            smil_doc = self._download_xml(
+                smil_url, video_id, note='Downloading SMIL metadata')
+            base_url_el = smil_doc.find('./head/meta')
+            if base_url_el:
+                base_url = base_url_el.attrib['base']
+            formats.extend([{
+                'format_id': 'rmtp',
+                'url': base_url if base_url_el else n.attrib['src'],
+                'play_path': n.attrib['src'],
+                'ext': 'flv',
+                'preference': -100,
+                'format_note': 'Seems to fail at example stream',
+            } for n in smil_doc.findall('./body/video')])
+        else:
+            formats.append({'url': smil_url})
 
-        smil_doc = self._download_xml(
-            smil_url, video_id, note='Downloading SMIL metadata')
-        base_url = smil_doc.find('./head/meta').attrib['base']
-        formats.extend([{
-            'format_id': 'rmtp',
-            'url': base_url,
-            'play_path': n.attrib['src'],
-            'ext': 'flv',
-            'preference': -100,
-            'format_note': 'Seems to fail at example stream',
-        } for n in smil_doc.findall('./body/video')])
         self._sort_formats(formats)
 
         return {
@@ -69,9 +74,9 @@ class SportDeutschlandIE(InfoExtractor):
             'title': asset['title'],
             'thumbnail': asset.get('image'),
             'description': asset.get('teaser'),
+            'duration': asset.get('duration'),
             'categories': categories,
             'view_count': asset.get('views'),
-            'rtmp_live': asset['live'],
+            'rtmp_live': asset.get('live'),
             'timestamp': parse_iso8601(asset.get('date')),
         }
-