[utils] Unescape all HTML entities written in hexadecimal form
[youtube-dl] / youtube_dl / utils.py
index 472d4df41fda2cb1ffd0392cc4da0f4bdcc2a48a..245d623d86df365a562fb395bc792b42f68634eb 100644 (file)
@@ -348,7 +348,7 @@ def _htmlentity_transform(entity):
     if entity in compat_html_entities.name2codepoint:
         return compat_chr(compat_html_entities.name2codepoint[entity])
 
-    mobj = re.match(r'#(x?[0-9]+)', entity)
+    mobj = re.match(r'#(x[0-9a-fA-F]+|[0-9]+)', entity)
     if mobj is not None:
         numstr = mobj.group(1)
         if numstr.startswith('x'):