[generic] Add support for LazyYT embeds (Fixes #4306)

[youtube-dl] / youtube_dl / extractor / generic.py
diff --git a/youtube_dl/extractor/generic.py b/youtube_dl/extractor/generic.py

index c7a824c29b15187becb0bb9758ee94348f2309da..6a95e2952a63a2960d795a6c6b538c9d4b6fe2b6 100644 (file)
--- a/youtube_dl/extractor/generic.py
+++ b/youtube_dl/extractor/generic.py
@@ -445,6 +445,14 @@ class GenericIE(InfoExtractor):
                  'title': 'Rosetta #CometLanding webcast HL 10',
              }
          },
+        # Page with multiple lazyYT YouTube embeds (extracted as a playlist)
+        {
+            'url': 'http://discourse.ubuntu.com/t/unity-8-desktop-mode-windows-on-mir/1986',
+            'info_dict': {
+                'title': 'Unity 8 desktop-mode windows on Mir! - Ubuntu Discourse',
+            },
+            'playlist_mincount': 2,
+        }
      ]
  
      def report_following_redirect(self, new_url):
@@ -537,9 +545,9 @@ class GenericIE(InfoExtractor):
  
              if default_search in ('error', 'fixup_error'):
                  raise ExtractorError(
-                    ('%r is not a valid URL. '
-                     'Set --default-search "ytsearch" (or run  youtube-dl "ytsearch:%s" ) to search YouTube'
-                    ) % (url, url), expected=True)
+                    '%r is not a valid URL. '
+                    'Set --default-search "ytsearch" (or run  youtube-dl "ytsearch:%s" ) to search YouTube'
+                    % (url, url), expected=True)
              else:
                  if ':' not in default_search:
                      default_search += ':'
@@ -702,6 +710,12 @@ class GenericIE(InfoExtractor):
              return _playlist_from_matches(
                  matches, lambda m: unescapeHTML(m[1]))
  
+        # Look for lazyYT YouTube embeds (video ID is in data-youtube-id); all matches become one playlist
+        matches = re.findall(
+            r'class="lazyYT" data-youtube-id="([^"]+)"', webpage)
+        if matches:
+            return _playlist_from_matches(matches, lambda m: unescapeHTML(m))
+
          # Look for embedded Dailymotion player
          matches = re.findall(
              r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?:)?//(?:www\.)?dailymotion\.com/embed/video/.+?)\1', webpage)
@@ -733,7 +747,7 @@ class GenericIE(InfoExtractor):
                  'title': video_title,
                  'id': video_id,
              }
-            
+
          match = re.search(r'(?:id=["\']wistia_|data-wistia-?id=["\']|Wistia\.embed\(["\'])(?P<id>[^"\']+)', webpage)
          if match:
              return {
@@ -748,7 +762,7 @@ class GenericIE(InfoExtractor):
          # Look for embedded blip.tv player
          mobj = re.search(r'<meta\s[^>]*https?://api\.blip\.tv/\w+/redirect/\w+/(\d+)', webpage)
          if mobj:
-            return self.url_result('http://blip.tv/a/a-'+mobj.group(1), 'BlipTV')
+            return self.url_result('http://blip.tv/a/a-' + mobj.group(1), 'BlipTV')
          mobj = re.search(r'<(?:iframe|embed|object)\s[^>]*(https?://(?:\w+\.)?blip\.tv/(?:play/|api\.swf#)[a-zA-Z0-9_]+)', webpage)
          if mobj:
              return self.url_result(mobj.group(1), 'BlipTV')
@@ -784,7 +798,7 @@ class GenericIE(InfoExtractor):
  
          # Look for Ooyala videos
          mobj = (re.search(r'player.ooyala.com/[^"?]+\?[^"]*?(?:embedCode|ec)=(?P<ec>[^"&]+)', webpage) or
-             re.search(r'OO.Player.create\([\'"].*?[\'"],\s*[\'"](?P<ec>.{32})[\'"]', webpage))
+                re.search(r'OO.Player.create\([\'"].*?[\'"],\s*[\'"](?P<ec>.{32})[\'"]', webpage))
          if mobj is not None:
              return OoyalaIE._build_url_result(mobj.group('ec'))
  
@@ -1025,4 +1039,3 @@ class GenericIE(InfoExtractor):
                  '_type': 'playlist',
                  'entries': entries,
              }
-