From: Jaime Marquínez Ferrándiz Date: Fri, 21 Mar 2014 21:14:24 +0000 (+0100) Subject: Merge remote-tracking branch 'dstftw/generic-webpage-unescape' X-Git-Url: http://git.bitcoin.ninja/index.cgi?p=youtube-dl;a=commitdiff_plain;h=0f2a2ba14b2cbf4bd8bec0ce32f8d7c27a733c68;hp=e24b5a861035c185eacc86a14967e67474235ca7 Merge remote-tracking branch 'dstftw/generic-webpage-unescape' Conflicts: youtube_dl/extractor/generic.py --- diff --git a/youtube_dl/extractor/generic.py b/youtube_dl/extractor/generic.py index 2254ade90..238913256 100644 --- a/youtube_dl/extractor/generic.py +++ b/youtube_dl/extractor/generic.py @@ -185,7 +185,18 @@ class GenericIE(InfoExtractor): 'uploader': 'Ze Frank', 'description': 'md5:ddb2a40ecd6b6a147e400e535874947b', } - } + }, + # nowvideo embed hidden behind percent encoding + { + 'url': 'http://www.waoanime.tv/the-super-dimension-fortress-macross-episode-1/', + 'md5': '2baf4ddd70f697d94b1c18cf796d5107', + 'info_dict': { + 'id': '06e53103ca9aa', + 'ext': 'flv', + 'title': 'Macross Episode 001 Watch Macross Episode 001 onl', + 'description': 'No description', + }, + }, ] def report_download_webpage(self, video_id): @@ -337,6 +348,11 @@ class GenericIE(InfoExtractor): except compat_xml_parse_error: pass + # Sometimes the embedded video player is hidden behind percent encoding + # (e.g. https://github.com/rg3/youtube-dl/issues/2448) + # Unescaping the whole page allows handling those cases in a generic way + webpage = compat_urllib_parse.unquote(webpage) + # it's tempting to parse this further, but you would # have to take into account all the variations like # Video Title - Site Name