From: Jaime Marquínez Ferrándiz Date: Thu, 29 Aug 2013 09:35:15 +0000 (+0200) Subject: Fix detection of the webpage charset if it's declared using ' instead of " X-Git-Url: http://git.bitcoin.ninja/index.cgi?a=commitdiff_plain;h=0d75ae2ce313c5738b2bdd9602ab3cc15e78810d;p=youtube-dl Fix detection of the webpage charset if it's declared using ' instead of " Like in "<meta charset='utf-8'>" --- diff --git a/youtube_dl/extractor/common.py b/youtube_dl/extractor/common.py index a2986cebe..77726ee24 100644 --- a/youtube_dl/extractor/common.py +++ b/youtube_dl/extractor/common.py @@ -150,7 +150,7 @@ class InfoExtractor(object): if m: encoding = m.group(1) else: - m = re.search(br'<meta[^>]+charset="?([^"]+)[ /">]', + m = re.search(br'<meta[^>]+charset=[\'"]?([^\'")]+)[ /\'">]', webpage_bytes[:1024]) if m: encoding = m.group(1).decode('ascii')