Use a wrapper around xml.etree.ElementTree.fromstring in python 2.x (#7178)

[youtube-dl] / youtube_dl / utils.py
diff --git a/youtube_dl/utils.py b/youtube_dl/utils.py

index 86c693358539451efc6fe4253382ff60427349c6..7d846d68085cdbf13e88f116b30b0ad9f2f21b0c 100644 (file)
--- a/youtube_dl/utils.py
+++ b/youtube_dl/utils.py
@@ -3,6 +3,7 @@
  
  from __future__ import unicode_literals
  
+import base64
  import calendar
  import codecs
  import contextlib
@@ -35,6 +36,7 @@ import zlib
  from .compat import (
      compat_basestring,
      compat_chr,
+    compat_etree_fromstring,
      compat_html_entities,
      compat_http_client,
      compat_kwargs,
@@ -1376,7 +1378,7 @@ def int_or_none(v, scale=1, default=None, get_attr=None, invscale=1):
      try:
          return int(v) * invscale // scale
      except ValueError:
-        pass
+        return default
  
  
  def str_or_none(v, default=None):
@@ -1392,7 +1394,12 @@ def str_to_int(int_str):
  
  
  def float_or_none(v, scale=1, invscale=1, default=None):
-    return default if v is None else (float(v) * invscale / scale)
+    if v is None:
+        return default
+    try:
+        return float(v) * invscale / scale
+    except ValueError:
+        return default
  
  
  def parse_duration(s):
@@ -1695,8 +1702,8 @@ def js_to_json(code):
          if v in ('true', 'false', 'null'):
              return v
          if v.startswith('"'):
-            return v
-        if v.startswith("'"):
+            v = re.sub(r"\\'", "'", v[1:-1])
+        elif v.startswith("'"):
              v = v[1:-1]
              v = re.sub(r"\\\\|\\'|\"", lambda m: {
                  '\\\\': '\\\\',
@@ -1790,6 +1797,10 @@ def urlhandle_detect_ext(url_handle):
      return mimetype2ext(getheader('Content-Type'))
  
  
+def encode_data_uri(data, mime_type):
+    return 'data:%s;base64,%s' % (mime_type, base64.b64encode(data).decode('ascii'))
+
+
  def age_restricted(content_limit, age_limit):
      """ Returns True iff the content should be blocked """
  
@@ -1964,7 +1975,7 @@ def dfxp2srt(dfxp_data):
  
          return out
  
-    dfxp = xml.etree.ElementTree.fromstring(dfxp_data.encode('utf-8'))
+    dfxp = compat_etree_fromstring(dfxp_data.encode('utf-8'))
      out = []
      paras = dfxp.findall(_x('.//ttml:p')) or dfxp.findall(_x('.//ttaf1:p')) or dfxp.findall('.//p')