[spiegel] Use generalized formats pre-testing

[youtube-dl] / youtube_dl / extractor / spiegel.py
diff --git a/youtube_dl/extractor/spiegel.py b/youtube_dl/extractor/spiegel.py

index 9586a7da2226ff822992cb21bc1698952c14b29e..b868241d50a23cbfa7289f6d2affb46e224696e3 100644 (file)
--- a/youtube_dl/extractor/spiegel.py
+++ b/youtube_dl/extractor/spiegel.py
@@ -5,6 +5,7 @@ import re
  
  from .common import InfoExtractor
  from ..compat import compat_urlparse
+from .spiegeltv import SpiegeltvIE
  
  
  class SpiegelIE(InfoExtractor):
@@ -42,7 +43,11 @@ class SpiegelIE(InfoExtractor):
  
      def _real_extract(self, url):
          video_id = self._match_id(url)
-        webpage = self._download_webpage(url, video_id)
+        webpage, handle = self._download_webpage_handle(url, video_id)
+
+        # 302 to spiegel.tv, like http://www.spiegel.de/video/der-film-zum-wochenende-die-wahrheit-ueber-maenner-video-99003272.html
+        if SpiegeltvIE.suitable(handle.geturl()):
+            return self.url_result(handle.geturl(), 'Spiegeltv')
  
          title = re.sub(r'\s+', ' ', self._html_search_regex(
              r'(?s)<(?:h1|div) class="module-title"[^>]*>(.*?)</(?:h1|div)>',
@@ -55,23 +60,24 @@ class SpiegelIE(InfoExtractor):
          xml_url = base_url + video_id + '.xml'
          idoc = self._download_xml(xml_url, video_id)
  
-        formats = [
-            {
-                'format_id': n.tag.rpartition('type')[2],
-                'url': base_url + n.find('./filename').text,
-                'width': int(n.find('./width').text),
-                'height': int(n.find('./height').text),
-                'abr': int(n.find('./audiobitrate').text),
-                'vbr': int(n.find('./videobitrate').text),
-                'vcodec': n.find('./codec').text,
-                'acodec': 'MP4A',
-            }
-            for n in list(idoc)
-            # Blacklist type 6, it's extremely LQ and not available on the same server
-            if n.tag.startswith('type') and n.tag != 'type6'
-        ]
+        formats = []
+        for n in list(idoc):
+            if n.tag.startswith('type') and n.tag != 'type6':
+                format_id = n.tag.rpartition('type')[2]
+                video_url = base_url + n.find('./filename').text
+                formats.append({
+                    'format_id': format_id,
+                    'url': video_url,
+                    'width': int(n.find('./width').text),
+                    'height': int(n.find('./height').text),
+                    'abr': int(n.find('./audiobitrate').text),
+                    'vbr': int(n.find('./videobitrate').text),
+                    'vcodec': n.find('./codec').text,
+                    'acodec': 'MP4A',
+                })
          duration = float(idoc[0].findall('./duration')[0].text)
  
+        self._check_formats(formats, video_id)
          self._sort_formats(formats)
  
          return {