[utils] Handle HTMLParseError in extract_attributes (closes #13349)

[youtube-dl] / test / test_utils.py
diff --git a/test/test_utils.py b/test/test_utils.py

index f31559e71f60f9474aa51ae36dbbc3e24affd5ce..2b93b360477f857b8fa693450d3c5375db5663cc 100644 (file)
--- a/test/test_utils.py
+++ b/test/test_utils.py
@@ -340,6 +340,7 @@ class TestUtil(unittest.TestCase):
          self.assertEqual(unified_timestamp('May 16, 2016 11:15 PM'), 1463440500)
          self.assertEqual(unified_timestamp('Feb 7, 2016 at 6:35 pm'), 1454870100)
          self.assertEqual(unified_timestamp('2017-03-30T17:52:41Q'), 1490896361)
+        self.assertEqual(unified_timestamp('Sep 11, 2013 | 5:49 AM'), 1378878540)
  
      def test_determine_ext(self):
          self.assertEqual(determine_ext('http://example.com/foo/bar.mp4/?download'), 'mp4')
@@ -678,6 +679,14 @@ class TestUtil(unittest.TestCase):
          d = json.loads(stripped)
          self.assertEqual(d, {'status': 'success'})
  
+        stripped = strip_jsonp('window.cb && window.cb({"status": "success"});')
+        d = json.loads(stripped)
+        self.assertEqual(d, {'status': 'success'})
+
+        stripped = strip_jsonp('window.cb && cb({"status": "success"});')
+        d = json.loads(stripped)
+        self.assertEqual(d, {'status': 'success'})
+
      def test_uppercase_escape(self):
          self.assertEqual(uppercase_escape('aä'), 'aä')
          self.assertEqual(uppercase_escape('\\U0001d550'), '𝕐')
@@ -907,6 +916,8 @@ class TestUtil(unittest.TestCase):
              supports_outside_bmp = False
          if supports_outside_bmp:
              self.assertEqual(extract_attributes('<e x="Smile &#128512;!">'), {'x': 'Smile \U0001f600!'})
+        # Malformed HTML should not break attributes extraction on older Python
+        self.assertEqual(extract_attributes('<mal"formed/>'), {})
  
      def test_clean_html(self):
          self.assertEqual(clean_html('a:\nb'), 'a: b')