[compat] Add compat_urllib_request_DataHandler

[youtube-dl] / youtube_dl / compat.py
diff --git a/youtube_dl/compat.py b/youtube_dl/compat.py

index e950a4688f023776093f950921123b8e75cc8c7a..d103ab9adf73ee664a0639e33191ef2ff89431ce 100644 (file)
--- a/youtube_dl/compat.py
+++ b/youtube_dl/compat.py
@@ -1,10 +1,14 @@
  from __future__ import unicode_literals
  
+import binascii
  import collections
+import email
  import getpass
+import io
  import optparse
  import os
  import re
+import shlex
  import shutil
  import socket
  import subprocess
@@ -37,11 +41,21 @@ try:
  except ImportError:  # Python 2
      import urlparse as compat_urlparse
  
+try:
+    import urllib.response as compat_urllib_response
+except ImportError:  # Python 2
+    import urllib as compat_urllib_response
+
  try:
      import http.cookiejar as compat_cookiejar
  except ImportError:  # Python 2
      import cookielib as compat_cookiejar
  
+try:
+    import http.cookies as compat_cookies
+except ImportError:  # Python 2
+    import Cookie as compat_cookies
+
  try:
      import html.entities as compat_html_entities
  except ImportError:  # Python 2
@@ -74,11 +88,19 @@ try:
  except ImportError:
      import BaseHTTPServer as compat_http_server
  
+# Text string type alias: the `unicode` builtin where it exists (Python 2),
+# otherwise `str`.
+try:
+    compat_str = unicode  # Python 2
+except NameError:
+    compat_str = str
+
  try:
      from urllib.parse import unquote_to_bytes as compat_urllib_parse_unquote_to_bytes
      from urllib.parse import unquote as compat_urllib_parse_unquote
      from urllib.parse import unquote_plus as compat_urllib_parse_unquote_plus
  except ImportError:  # Python 2
+    _asciire = (compat_urllib_parse._asciire if hasattr(compat_urllib_parse, '_asciire')
+                else re.compile('([\x00-\x7f]+)'))
+
      # HACK: The following are the correct unquote_to_bytes, unquote and unquote_plus
      # implementations from cpython 3.4.3's stdlib. Python 2's version
      # is apparently broken (see https://github.com/rg3/youtube-dl/pull/6244)
@@ -91,7 +113,7 @@ except ImportError:  # Python 2
              # Is it a string-like object?
              string.split
              return b''
-        if isinstance(string, unicode):
+        if isinstance(string, compat_str):
              string = string.encode('utf-8')
          bits = string.split(b'%')
          if len(bits) == 1:
@@ -124,7 +146,7 @@ except ImportError:  # Python 2
              encoding = 'utf-8'
          if errors is None:
              errors = 'replace'
-        bits = compat_urllib_parse._asciire.split(string)
+        bits = _asciire.split(string)
          res = [bits[0]]
          append = res.append
          for i in range(1, len(bits), 2):
@@ -142,9 +164,38 @@ except ImportError:  # Python 2
          return compat_urllib_parse_unquote(string, encoding, errors)
  
  try:
-    compat_str = unicode  # Python 2
-except NameError:
-    compat_str = str
+    from urllib.request import DataHandler as compat_urllib_request_DataHandler
+except ImportError:  # Python < 3.4
+    # Ported from CPython 98774:1733b3bd46db, Lib/urllib/request.py
+    class compat_urllib_request_DataHandler(compat_urllib_request.BaseHandler):
+        """Fallback handler that opens "data:" URLs (RFC 2397).
+
+        Defined only when urllib.request.DataHandler cannot be imported.
+        """
+        def data_open(self, req):
+            """Decode the payload embedded in a data: URL into a response.
+
+            req must provide get_full_url(). The result is a
+            compat_urllib_response.addinfourl over an io.BytesIO holding the
+            decoded bytes, with Content-type and Content-length headers.
+            A URL without ":" or without "," makes the tuple unpacking below
+            raise ValueError.
+            """
+            # data URLs as specified in RFC 2397.
+            #
+            # ignores POSTed data
+            #
+            # syntax:
+            # dataurl   := "data:" [ mediatype ] [ ";base64" ] "," data
+            # mediatype := [ type "/" subtype ] *( ";" parameter )
+            # data      := *urlchar
+            # parameter := attribute "=" value
+            url = req.get_full_url()
+
+            # scheme is unpacked but not used afterwards.
+            scheme, data = url.split(":", 1)
+            mediatype, data = data.split(",", 1)
+
+            # even base64 encoded data URLs might be quoted so unquote in any case:
+            data = compat_urllib_parse_unquote_to_bytes(data)
+            if mediatype.endswith(";base64"):
+                data = binascii.a2b_base64(data)
+                # Drop the 7-character ";base64" suffix from the media type.
+                mediatype = mediatype[:-7]
+
+            if not mediatype:
+                mediatype = "text/plain;charset=US-ASCII"
+
+            # Headers are produced by parsing a two-line header text.
+            headers = email.message_from_string(
+                "Content-type: %s\nContent-length: %d\n" % (mediatype, len(data)))
+
+            return compat_urllib_response.addinfourl(io.BytesIO(data), headers, url)
  
  try:
      compat_basestring = basestring  # Python 2
@@ -219,6 +270,17 @@ except ImportError:  # Python < 3.3
              return "'" + s.replace("'", "'\"'\"'") + "'"
  
  
+# compat_shlex_split is shlex.split itself on Python >= 2.7.3; on older
+# versions it is a wrapper that passes UTF-8 encoded bytes instead of text.
+if sys.version_info >= (2, 7, 3):
+    compat_shlex_split = shlex.split
+else:
+    # Working around shlex issue with unicode strings on some python 2
+    # versions (see http://bugs.python.org/issue1548891)
+    def compat_shlex_split(s, comments=False, posix=True):
+        """Split s with shlex.split, encoding text input to UTF-8 first.
+
+        comments and posix are forwarded positionally to shlex.split.
+        NOTE(review): when s was encoded here, the returned tokens are
+        presumably byte strings rather than text -- confirm callers cope.
+        """
+        if isinstance(s, compat_str):
+            s = s.encode('utf-8')
+        return shlex.split(s, comments, posix)
+
+
  def compat_ord(c):
      if type(c) is int:
          return c
@@ -396,26 +458,32 @@ if hasattr(shutil, 'get_terminal_size'):  # Python >= 3.3
  else:
      _terminal_size = collections.namedtuple('terminal_size', ['columns', 'lines'])
  
-    def compat_get_terminal_size():
-        columns = compat_getenv('COLUMNS', None)
+    def compat_get_terminal_size(fallback=(80, 24)):
+        """Return the terminal size as a terminal_size(columns, lines) tuple.
+
+        COLUMNS and LINES environment values are used when set and positive.
+        Any dimension still missing is taken from the output of `stty size`,
+        or from fallback (columns, lines) when that lookup raises.
+
+        NOTE(review): int() on a non-numeric COLUMNS/LINES value raises
+        ValueError here, outside the try block -- confirm that is intended.
+        """
+        columns = compat_getenv('COLUMNS')
          if columns:
              columns = int(columns)
          else:
              columns = None
-        lines = compat_getenv('LINES', None)
+        lines = compat_getenv('LINES')
          if lines:
              lines = int(lines)
          else:
              lines = None
  
-        try:
-            sp = subprocess.Popen(
-                ['stty', 'size'],
-                stdout=subprocess.PIPE, stderr=subprocess.PIPE)
-            out, err = sp.communicate()
-            lines, columns = map(int, out.split())
-        except Exception:
-            pass
+        # Only spawn stty when the environment left a dimension unset or
+        # non-positive.
+        if columns is None or lines is None or columns <= 0 or lines <= 0:
+            try:
+                sp = subprocess.Popen(
+                    ['stty', 'size'],
+                    stdout=subprocess.PIPE, stderr=subprocess.PIPE)
+                out, err = sp.communicate()
+                # The output is parsed as two integers: lines, then columns.
+                _lines, _columns = map(int, out.split())
+            except Exception:
+                _columns, _lines = _terminal_size(*fallback)
+
+            if columns is None or columns <= 0:
+                columns = _columns
+            if lines is None or lines <= 0:
+                lines = _lines
          return _terminal_size(columns, lines)
  
  try:
@@ -428,11 +496,17 @@ except TypeError:  # Python 2.6
              yield n
              n += step
  
+if sys.version_info >= (3, 0):
+    from tokenize import tokenize as compat_tokenize_tokenize
+else:
+    from tokenize import generate_tokens as compat_tokenize_tokenize
+
  __all__ = [
      'compat_HTTPError',
      'compat_basestring',
      'compat_chr',
      'compat_cookiejar',
+    'compat_cookies',
      'compat_expanduser',
      'compat_get_terminal_size',
      'compat_getenv',
@@ -445,9 +519,11 @@ __all__ = [
      'compat_ord',
      'compat_parse_qs',
      'compat_print',
+    'compat_shlex_split',
      'compat_socket_create_connection',
      'compat_str',
      'compat_subprocess_get_DEVNULL',
+    'compat_tokenize_tokenize',
      'compat_urllib_error',
      'compat_urllib_parse',
      'compat_urllib_parse_unquote',
@@ -455,6 +531,8 @@ __all__ = [
      'compat_urllib_parse_unquote_to_bytes',
      'compat_urllib_parse_urlparse',
      'compat_urllib_request',
+    'compat_urllib_request_DataHandler',
+    'compat_urllib_response',
      'compat_urlparse',
      'compat_urlretrieve',
      'compat_xml_parse_error',