[wistia] Add support for multiple generic embeds (closes #8347, closes #11385)

author Sergey M․ <dstftw@gmail.com>

Sat, 22 Feb 2020 23:47:11 +0000 (06:47 +0700)

committer Sergey M․ <dstftw@gmail.com>

Sat, 22 Feb 2020 23:47:11 +0000 (06:47 +0700)
author Sergey M․ <dstftw@gmail.com>
Sat, 22 Feb 2020 23:47:11 +0000 (06:47 +0700)
committer Sergey M․ <dstftw@gmail.com>
Sat, 22 Feb 2020 23:47:11 +0000 (06:47 +0700)
diff --git a/youtube_dl/extractor/generic.py b/youtube_dl/extractor/generic.py

index 3c002472f795b3600c8f721e76c446f85f3f9bf5..04c026984b12086085ca094673d1e84bf4419745 100644 (file)
--- a/youtube_dl/extractor/generic.py
+++ b/youtube_dl/extractor/generic.py
@@ -2537,14 +2537,15 @@ class GenericIE(InfoExtractor):
                  dailymail_urls, video_id, video_title, ie=DailyMailIE.ie_key())
  
          # Look for embedded Wistia player
-        wistia_url = WistiaIE._extract_url(webpage)
-        if wistia_url:
-            return {
-                '_type': 'url_transparent',
-                'url': self._proto_relative_url(wistia_url),
-                'ie_key': WistiaIE.ie_key(),
-                'uploader': video_uploader,
-            }
+        wistia_urls = WistiaIE._extract_urls(webpage)
+        if wistia_urls:
+            playlist = self.playlist_from_matches(wistia_urls, video_id, video_title, ie=WistiaIE.ie_key())
+            for entry in playlist['entries']:
+                entry.update({
+                    '_type': 'url_transparent',
+                    'uploader': video_uploader,
+                })
+            return playlist
  
          # Look for SVT player
          svt_url = SVTIE._extract_url(webpage)
diff --git a/youtube_dl/extractor/wistia.py b/youtube_dl/extractor/wistia.py

index 085514d470bcee6d5719a9260ceefdfc3a9cdb17..168e5e90152b44d76dcbbbeb1b274db5dcbf5827 100644 (file)
--- a/youtube_dl/extractor/wistia.py
+++ b/youtube_dl/extractor/wistia.py
@@ -45,22 +45,23 @@ class WistiaIE(InfoExtractor):
      # https://wistia.com/support/embed-and-share/video-on-your-website
      @staticmethod
      def _extract_url(webpage):
-        match = re.search(
-            r'<(?:meta[^>]+?content|(?:iframe|script)[^>]+?src)=["\'](?P<url>(?:https?:)?//(?:fast\.)?wistia\.(?:net|com)/embed/(?:iframe|medias)/[a-z0-9]{10})', webpage)
-        if match:
-            return unescapeHTML(match.group('url'))
+        urls = WistiaIE._extract_urls(webpage)
+        return urls[0] if urls else None
  
-        match = re.search(
-            r'''(?sx)
-                <script[^>]+src=(["'])(?:https?:)?//fast\.wistia\.com/assets/external/E-v1\.js\1[^>]*>.*?
-                <div[^>]+class=(["']).*?\bwistia_async_(?P<id>[a-z0-9]{10})\b.*?\2
-            ''', webpage)
-        if match:
-            return 'wistia:%s' % match.group('id')
-
-        match = re.search(r'(?:data-wistia-?id=["\']|Wistia\.embed\(["\']|id=["\']wistia_)(?P<id>[a-z0-9]{10})', webpage)
-        if match:
-            return 'wistia:%s' % match.group('id')
+    @staticmethod
+    def _extract_urls(webpage):
+        urls = []
+        for match in re.finditer(
+                r'<(?:meta[^>]+?content|(?:iframe|script)[^>]+?src)=["\'](?P<url>(?:https?:)?//(?:fast\.)?wistia\.(?:net|com)/embed/(?:iframe|medias)/[a-z0-9]{10})', webpage):
+            urls.append(unescapeHTML(match.group('url')))
+        for match in re.finditer(
+                r'''(?sx)
+                    <div[^>]+class=(["']).*?\bwistia_async_(?P<id>[a-z0-9]{10})\b.*?\2
+                ''', webpage):
+            urls.append('wistia:%s' % match.group('id'))
+        for match in re.finditer(r'(?:data-wistia-?id=["\']|Wistia\.embed\(["\']|id=["\']wistia_)(?P<id>[a-z0-9]{10})', webpage):
+            urls.append('wistia:%s' % match.group('id'))
+        return urls
  
      def _real_extract(self, url):
          video_id = self._match_id(url)
author	Sergey M․ <dstftw@gmail.com>
	Sat, 22 Feb 2020 23:47:11 +0000 (06:47 +0700)
committer	Sergey M․ <dstftw@gmail.com>
	Sat, 22 Feb 2020 23:47:11 +0000 (06:47 +0700)
youtube_dl/extractor/generic.py		patch \| blob \| history
youtube_dl/extractor/wistia.py		patch \| blob \| history