_find_jwplayer_data() returns dict or None

[youtube-dl] / youtube_dl / extractor / common.py
diff --git a/youtube_dl/extractor/common.py b/youtube_dl/extractor/common.py

index 86aff331297af8ab2d30b85e48b6fde025d4fcbb..c2ca73ee1756519e90e19fc7512b1a77d834b2ee 100644 (file)
--- a/youtube_dl/extractor/common.py
+++ b/youtube_dl/extractor/common.py
@@ -390,10 +390,9 @@ class InfoExtractor(object):
  
          This method is used to initialize geo bypass mechanism based on faking
          X-Forwarded-For HTTP header. A random country from provided country list
-        is selected and a random IP brlonging to this country is generated. This
+        is selected and a random IP belonging to this country is generated. This
          IP will be passed as X-Forwarded-For HTTP header in all subsequent
          HTTP requests.
-        Method does nothing if no countries are specified.
  
          This method will be used for initial geo bypass mechanism initialization
          during the instance initialization with _GEO_COUNTRIES.
@@ -402,8 +401,6 @@ class InfoExtractor(object):
          information is not available beforehand (e.g. obtained during
          extraction) or due to some another reason.
          """
-        if not countries:
-            return
          if not self._x_forwarded_for_ip:
              country_code = self._downloader.params.get('geo_bypass_country', None)
              # If there is no explicit country for geo bypass specified and
@@ -418,7 +415,8 @@ class InfoExtractor(object):
                  self._x_forwarded_for_ip = GeoUtils.random_ipv4(country_code)
                  if self._downloader.params.get('verbose', False):
                      self._downloader.to_stdout(
-                        '[debug] Using fake %s IP as X-Forwarded-For.' % self._x_forwarded_for_ip)
+                        '[debug] Using fake IP %s (%s) as X-Forwarded-For.'
+                        % (self._x_forwarded_for_ip, country_code.upper()))
  
      def extract(self, url):
          """Extracts URL information and returns it in list of dicts."""
@@ -447,10 +445,12 @@ class InfoExtractor(object):
                  self._downloader.params.get('geo_bypass', True) and
                  not self._x_forwarded_for_ip and
                  countries):
-            self._x_forwarded_for_ip = GeoUtils.random_ipv4(random.choice(countries))
+            country_code = random.choice(countries)
+            self._x_forwarded_for_ip = GeoUtils.random_ipv4(country_code)
              if self._x_forwarded_for_ip:
                  self.report_warning(
-                    'Video is geo restricted. Retrying extraction with fake %s IP as X-Forwarded-For.' % self._x_forwarded_for_ip)
+                    'Video is geo restricted. Retrying extraction with fake IP %s (%s) as X-Forwarded-For.'
+                    % (self._x_forwarded_for_ip, country_code.upper()))
                  return True
          return False
  
@@ -2010,7 +2010,7 @@ class InfoExtractor(object):
                  })
          return formats
  
-    def _parse_html5_media_entries(self, base_url, webpage, video_id, m3u8_id=None, m3u8_entry_protocol='m3u8', mpd_id=None):
+    def _parse_html5_media_entries(self, base_url, webpage, video_id, m3u8_id=None, m3u8_entry_protocol='m3u8', mpd_id=None, preference=None):
          def absolute_url(video_url):
              return compat_urlparse.urljoin(base_url, video_url)
  
@@ -2032,7 +2032,8 @@ class InfoExtractor(object):
                  is_plain_url = False
                  formats = self._extract_m3u8_formats(
                      full_url, video_id, ext='mp4',
-                    entry_protocol=m3u8_entry_protocol, m3u8_id=m3u8_id)
+                    entry_protocol=m3u8_entry_protocol, m3u8_id=m3u8_id,
+                    preference=preference)
              elif ext == 'mpd':
                  is_plain_url = False
                  formats = self._extract_mpd_formats(
@@ -2160,18 +2161,24 @@ class InfoExtractor(object):
                      })
          return formats
  
-    @staticmethod
-    def _find_jwplayer_data(webpage):
+    def _find_jwplayer_data(self, webpage, video_id=None, transform_source=js_to_json):
          mobj = re.search(
              r'jwplayer\((?P<quote>[\'"])[^\'" ]+(?P=quote)\)\.setup\s*\((?P<options>[^)]+)\)',
              webpage)
          if mobj:
-            return mobj.group('options')
+            try:
+                jwplayer_data = self._parse_json(mobj.group('options'),
+                                                 video_id=video_id,
+                                                 transform_source=transform_source)
+            except ExtractorError:
+                pass
+            else:
+                if isinstance(jwplayer_data, dict):
+                    return jwplayer_data
  
      def _extract_jwplayer_data(self, webpage, video_id, *args, **kwargs):
-        jwplayer_data = self._parse_json(
-            self._find_jwplayer_data(webpage), video_id,
-            transform_source=js_to_json)
+        jwplayer_data = self._find_jwplayer_data(
+            webpage, video_id, transform_source=js_to_json)
          return self._parse_jwplayer_data(
              jwplayer_data, video_id, *args, **kwargs)