Merge branch 'pr-twitter' of https://github.com/atomicdryad/youtube-dl into atomicdry...

[youtube-dl] / youtube_dl / YoutubeDL.py
diff --git a/youtube_dl/YoutubeDL.py b/youtube_dl/YoutubeDL.py

index 1446b3254f0085cf933d368b7109723af3720fba..adf70d658b2d24b6b526869da9a8b0005cca5afb 100755 (executable)
--- a/youtube_dl/YoutubeDL.py
+++ b/youtube_dl/YoutubeDL.py
@@ -28,7 +28,6 @@ if os.name == 'nt':
      import ctypes
  
  from .compat import (
-    compat_basestring,
      compat_cookiejar,
      compat_expanduser,
      compat_get_terminal_size,
@@ -40,7 +39,6 @@ from .compat import (
      compat_urllib_request,
  )
  from .utils import (
-    escape_url,
      ContentTooShortError,
      date_from_str,
      DateRange,
@@ -51,7 +49,6 @@ from .utils import (
      ExtractorError,
      format_bytes,
      formatSeconds,
-    HEADRequest,
      locked_file,
      make_HTTPS_handler,
      MaxDownloadsReached,
@@ -72,6 +69,7 @@ from .utils import (
      version_tuple,
      write_json_file,
      write_string,
+    YoutubeDLCookieProcessor,
      YoutubeDLHandler,
      prepend_extension,
      replace_extension,
@@ -287,7 +285,11 @@ class YoutubeDL(object):
          self._num_downloads = 0
          self._screen_file = [sys.stdout, sys.stderr][params.get('logtostderr', False)]
          self._err_file = sys.stderr
-        self.params = params
+        self.params = {
+            # Default parameters
+            'nocheckcertificate': False,
+        }
+        self.params.update(params)
          self.cache = Cache(self)
  
          if params.get('bidi_workaround', False):
@@ -1230,13 +1232,20 @@ class YoutubeDL(object):
              except (ValueError, OverflowError, OSError):
                  pass
  
+        subtitles = info_dict.get('subtitles')
+        if subtitles:
+            for _, subtitle in subtitles.items():
+                for subtitle_format in subtitle:
+                    if 'ext' not in subtitle_format:
+                        subtitle_format['ext'] = determine_ext(subtitle_format['url']).lower()
+
          if self.params.get('listsubtitles', False):
              if 'automatic_captions' in info_dict:
                  self.list_subtitles(info_dict['id'], info_dict.get('automatic_captions'), 'automatic captions')
-            self.list_subtitles(info_dict['id'], info_dict.get('subtitles'), 'subtitles')
+            self.list_subtitles(info_dict['id'], subtitles, 'subtitles')
              return
          info_dict['requested_subtitles'] = self.process_subtitles(
-            info_dict['id'], info_dict.get('subtitles'),
+            info_dict['id'], subtitles,
              info_dict.get('automatic_captions'))
  
          # We now pick which formats have to be downloaded
@@ -1860,27 +1869,6 @@ class YoutubeDL(object):
  
      def urlopen(self, req):
          """ Start an HTTP download """
-
-        # According to RFC 3986, URLs can not contain non-ASCII characters, however this is not
-        # always respected by websites, some tend to give out URLs with non percent-encoded
-        # non-ASCII characters (see telemb.py, ard.py [#3412])
-        # urllib chokes on URLs with non-ASCII characters (see http://bugs.python.org/issue3991)
-        # To work around aforementioned issue we will replace request's original URL with
-        # percent-encoded one
-        req_is_string = isinstance(req, compat_basestring)
-        url = req if req_is_string else req.get_full_url()
-        url_escaped = escape_url(url)
-
-        # Substitute URL if any change after escaping
-        if url != url_escaped:
-            if req_is_string:
-                req = url_escaped
-            else:
-                req_type = HEADRequest if req.get_method() == 'HEAD' else compat_urllib_request.Request
-                req = req_type(
-                    url_escaped, data=req.data, headers=req.headers,
-                    origin_req_host=req.origin_req_host, unverifiable=req.unverifiable)
-
          return self._opener.open(req, timeout=self._socket_timeout)
  
      def print_debug_header(self):
@@ -1963,8 +1951,7 @@ class YoutubeDL(object):
              if os.access(opts_cookiefile, os.R_OK):
                  self.cookiejar.load()
  
-        cookie_processor = compat_urllib_request.HTTPCookieProcessor(
-            self.cookiejar)
+        cookie_processor = YoutubeDLCookieProcessor(self.cookiejar)
          if opts_proxy is not None:
              if opts_proxy == '':
                  proxies = {}
@@ -2033,7 +2020,7 @@ class YoutubeDL(object):
                                 (info_dict['extractor'], info_dict['id'], thumb_display_id))
                  try:
                      uf = self.urlopen(t['url'])
-                    with open(thumb_filename, 'wb') as thumbf:
+                    with open(encodeFilename(thumb_filename), 'wb') as thumbf:
                          shutil.copyfileobj(uf, thumbf)
                      self.to_screen('[%s] %s: Writing thumbnail %sto: %s' %
                                     (info_dict['extractor'], info_dict['id'], thumb_display_id, thumb_filename))