Add display_id field

[youtube-dl] / youtube_dl / extractor / common.py
diff --git a/youtube_dl/extractor/common.py b/youtube_dl/extractor/common.py

index f7478d4598e8f15ea802ec9451aff53ce452fe7a..080c9bdfada0440201a85027ddbb34772d09b28f 100644 (file)
--- a/youtube_dl/extractor/common.py
+++ b/youtube_dl/extractor/common.py
@@ -88,6 +88,10 @@ class InfoExtractor(object):
  
      The following fields are optional:
  
+    display_id      An alternative identifier for the video, not necessarily
+                    unique, but available before title. Typically, id is
+                    something like "4234987", title "Dancing naked mole rats",
+                    and display_id "dancing-naked-mole-rats"
      thumbnails:     A list of dictionaries (with the entries "resolution" and
                      "url") for the varying thumbnails
      thumbnail:      Full URL to a video thumbnail image.
@@ -271,8 +275,11 @@ class InfoExtractor(object):
  
      def _download_json(self, url_or_request, video_id,
                         note=u'Downloading JSON metadata',
-                       errnote=u'Unable to download JSON metadata'):
+                       errnote=u'Unable to download JSON metadata',
+                       transform_source=None):
          json_string = self._download_webpage(url_or_request, video_id, note, errnote)
+        if transform_source:
+            json_string = transform_source(json_string)
          try:
              return json.loads(json_string)
          except ValueError as ve:
@@ -399,7 +406,7 @@ class InfoExtractor(object):
      # Helper functions for extracting OpenGraph info
      @staticmethod
      def _og_regexes(prop):
-        content_re = r'content=(?:"([^>]+?)"|\'(.+?)\')'
+        content_re = r'content=(?:"([^>]+?)"|\'([^>]+?)\')'
          property_re = r'(?:name|property)=[\'"]og:%s[\'"]' % re.escape(prop)
          template = r'<meta[^>]+?%s[^>]+?%s'
          return [
@@ -465,6 +472,10 @@ class InfoExtractor(object):
          }
          return RATING_TABLE.get(rating.lower(), None)
  
+    def _twitter_search_player(self, html):
+        return self._html_search_meta('twitter:player', html,
+            'twitter card player')
+
      def _sort_formats(self, formats):
          if not formats:
              raise ExtractorError(u'No video formats found')