[ard] Add alive tests

[youtube-dl] / youtube_dl / extractor / ard.py
diff --git a/youtube_dl/extractor/ard.py b/youtube_dl/extractor/ard.py

index 3f248b14728ab3655a2e17f7b38a95184042d770..8d3dd78a3ee16895f267775f8815321af49f9a91 100644 (file)
--- a/youtube_dl/extractor/ard.py
+++ b/youtube_dl/extractor/ard.py
@@ -5,6 +5,7 @@ import re
  
  from .common import InfoExtractor
  from .generic import GenericIE
+from ..compat import compat_str
  from ..utils import (
      determine_ext,
      ExtractorError,
@@ -23,6 +24,20 @@ class ARDMediathekIE(InfoExtractor):
      _VALID_URL = r'^https?://(?:(?:www\.)?ardmediathek\.de|mediathek\.(?:daserste|rbb-online)\.de)/(?:.*/)(?P<video_id>[0-9]+|[^0-9][^/\?]+)[^/\?]*(?:\?.*)?'
  
      _TESTS = [{
+        'url': 'http://www.ardmediathek.de/tv/S%C3%9CDLICHT/Was-ist-die-Kunst-der-Zukunft-liebe-Ann/BR-Fernsehen/Video?bcastId=34633636&documentId=44726822',
+        'info_dict': {
+            'id': '44726822',
+            'ext': 'mp4',
+            'title': 'Was ist die Kunst der Zukunft, liebe Anna McCarthy?',
+            'description': 'md5:4ada28b3e3b5df01647310e41f3a62f5',
+            'duration': 1740,
+        },
+        'params': {
+            # m3u8 download
+            'skip_download': True,
+        }
+    },
+    {
          'url': 'http://www.ardmediathek.de/tv/Dokumentation-und-Reportage/Ich-liebe-das-Leben-trotzdem/rbb-Fernsehen/Video?documentId=29582122&bcastId=3822114',
          'info_dict': {
              'id': '29582122',
@@ -126,6 +141,8 @@ class ARDMediathekIE(InfoExtractor):
                  quality = stream.get('_quality')
                  server = stream.get('_server')
                  for stream_url in stream_urls:
+                    if not isinstance(stream_url, compat_str) or '//' not in stream_url:
+                        continue
                      ext = determine_ext(stream_url)
                      if quality != 'auto' and ext in ('f4m', 'm3u8'):
                          continue
@@ -146,13 +163,11 @@ class ARDMediathekIE(InfoExtractor):
                                  'play_path': stream_url,
                                  'format_id': 'a%s-rtmp-%s' % (num, quality),
                              }
-                        elif stream_url.startswith('http'):
+                        else:
                              f = {
                                  'url': stream_url,
                                  'format_id': 'a%s-%s-%s' % (num, ext, quality)
                              }
-                        else:
-                            continue
                          m = re.search(r'_(?P<width>\d+)x(?P<height>\d+)\.mp4$', stream_url)
                          if m:
                              f.update({
@@ -195,7 +210,7 @@ class ARDMediathekIE(InfoExtractor):
  
          title = self._html_search_regex(
              [r'<h1(?:\s+class="boxTopHeadline")?>(.*?)</h1>',
-             r'<meta name="dcterms.title" content="(.*?)"/>',
+             r'<meta name="dcterms\.title" content="(.*?)"/>',
               r'<h4 class="headline">(.*?)</h4>'],
              webpage, 'title')
          description = self._html_search_meta(
@@ -251,7 +266,20 @@ class ARDMediathekIE(InfoExtractor):
  
  class ARDIE(InfoExtractor):
      _VALID_URL = r'(?P<mainurl>https?://(www\.)?daserste\.de/[^?#]+/videos/(?P<display_id>[^/?#]+)-(?P<id>[0-9]+))\.html'
-    _TEST = {
+    _TESTS = [{
+        'url': 'http://www.daserste.de/information/talk/maischberger/videos/das-groko-drama-zerlegen-sich-die-volksparteien-video-102.html',
+        'md5': '8e4ec85f31be7c7fc08a26cdbc5a1f49',
+        'info_dict': {
+            'display_id': 'das-groko-drama-zerlegen-sich-die-volksparteien-video',
+            'id': '102',
+            'ext': 'mp4',
+            'duration': 4435.0,
+            'title': 'Das GroKo-Drama: Zerlegen sich die Volksparteien?',
+            'upload_date': '20180214',
+            'thumbnail': r're:^https?://.*\.jpg$',
+        },
+    },
+    {
          'url': 'http://www.daserste.de/information/reportage-dokumentation/dokus/videos/die-story-im-ersten-mission-unter-falscher-flagge-100.html',
          'md5': 'd216c3a86493f9322545e045ddc3eb35',
          'info_dict': {
@@ -264,7 +292,7 @@ class ARDIE(InfoExtractor):
              'thumbnail': r're:^https?://.*\.jpg$',
          },
          'skip': 'HTTP Error 404: Not Found',
-    }
+    }]
  
      def _real_extract(self, url):
          mobj = re.match(self._VALID_URL, url)