lazy extractors: specify the encoding

[youtube-dl] / youtube_dl / YoutubeDL.py
diff --git a/youtube_dl/YoutubeDL.py b/youtube_dl/YoutubeDL.py

index 53a36c145dc775b876cca41e732b7f7b312ec0a1..f18a8e840553528703e79cf3dd2415173a568d0e 100755 (executable)
--- a/youtube_dl/YoutubeDL.py
+++ b/youtube_dl/YoutubeDL.py
@@ -82,7 +82,7 @@ from .utils import (
      YoutubeDLHandler,
  )
  from .cache import Cache
-from .extractor import get_info_extractor, gen_extractors
+from .extractor import get_info_extractor, gen_extractor_classes
  from .downloader import get_suitable_downloader
  from .downloader.rtmp import rtmpdump_version
  from .postprocessor import (
@@ -378,8 +378,9 @@ class YoutubeDL(object):
      def add_info_extractor(self, ie):
          """Add an InfoExtractor object to the end of the list."""
          self._ies.append(ie)
-        self._ies_instances[ie.ie_key()] = ie
-        ie.set_downloader(self)
+        if not isinstance(ie, type):
+            self._ies_instances[ie.ie_key()] = ie
+            ie.set_downloader(self)
  
      def get_info_extractor(self, ie_key):
          """
@@ -397,7 +398,7 @@ class YoutubeDL(object):
          """
          Add the InfoExtractors returned by gen_extractors to the end of the list
          """
-        for ie in gen_extractors():
+        for ie in gen_extractor_classes():
              self.add_info_extractor(ie)
  
      def add_post_processor(self, pp):
@@ -661,6 +662,7 @@ class YoutubeDL(object):
              if not ie.suitable(url):
                  continue
  
+            ie = self.get_info_extractor(ie.ie_key())
              if not ie.working():
                  self.report_warning('The program functionality for this site has been marked as broken, '
                                      'and will probably not work.')
@@ -1240,7 +1242,10 @@ class YoutubeDL(object):
              self.list_thumbnails(info_dict)
              return
  
-        if thumbnails and 'thumbnail' not in info_dict:
+        thumbnail = info_dict.get('thumbnail')
+        if thumbnail:
+            info_dict['thumbnail'] = sanitize_url(thumbnail)
+        elif thumbnails:
              info_dict['thumbnail'] = thumbnails[-1]['url']
  
          if 'display_id' not in info_dict and 'id' in info_dict:
@@ -1265,7 +1270,8 @@ class YoutubeDL(object):
          if subtitles:
              for _, subtitle in subtitles.items():
                  for subtitle_format in subtitle:
-                    subtitle_format['url'] = sanitize_url(subtitle_format['url'])
+                    if subtitle_format.get('url'):
+                        subtitle_format['url'] = sanitize_url(subtitle_format['url'])
                      if 'ext' not in subtitle_format:
                          subtitle_format['ext'] = determine_ext(subtitle_format['url']).lower()