From: Yen Chi Hsuan
Date: Fri, 9 Oct 2015 06:11:00 +0000 (+0800)
Subject: [extractor/common] Allow HTML5 unquoted attribute values
X-Git-Url: http://git.bitcoin.ninja/index.cgi?p=youtube-dl;a=commitdiff_plain;h=57935b2564c082b90a60468d4c844b219118886a

[extractor/common] Allow HTML5 unquoted attribute values

Fixes #7108

HTML5 allows unquoted attribute values. See the "Unquoted attribute value syntax" section [1] for more information.

[1] http://www.w3.org/TR/html5/syntax.html
---

diff --git a/youtube_dl/extractor/common.py b/youtube_dl/extractor/common.py
index dbae75406..242618c58 100644
--- a/youtube_dl/extractor/common.py
+++ b/youtube_dl/extractor/common.py
@@ -646,7 +646,7 @@ class InfoExtractor(object):
     @staticmethod
     def _og_regexes(prop):
         content_re = r'content=(?:"([^>]+?)"|\'([^>]+?)\')'
-        property_re = r'(?:name|property)=[\'"]og:%s[\'"]' % re.escape(prop)
+        property_re = r'(?:name|property)=[\'"]?og:%s[\'"]?' % re.escape(prop)
         template = r'<meta[^>]+?%s[^>]+?%s'
         return [
             template % (property_re, content_re),