From: Jaime Marquínez Ferrándiz
Date: Thu, 3 Jan 2013 20:05:04 +0000 (+0100)
Subject: Allow downloading videos with other characters in their titles
X-Git-Url: http://git.bitcoin.ninja/index.cgi?a=commitdiff_plain;h=9cf98a2bcc9cae6bb308b42c0da3587b7d4115f2;p=youtube-dl

Allow downloading videos with other characters in their titles

Especially html entities
---

diff --git a/youtube_dl/InfoExtractors.py b/youtube_dl/InfoExtractors.py
index d040eec82..f72defdf2 100755
--- a/youtube_dl/InfoExtractors.py
+++ b/youtube_dl/InfoExtractors.py
@@ -3694,9 +3694,10 @@ class SteamIE(InfoExtractor):
         videourl = 'http://store.steampowered.com/video/%s/' % gameID
         webpage = self._download_webpage(videourl, gameID)
         mweb = re.finditer(urlRE, webpage)
-        namesRE = r'(?P<videoName>[\w:/\.\?=\+\s-]+)'
+        namesRE = r'(?P<videoName>.+)'
         titles = list(re.finditer(namesRE, webpage))
         videos = []
+        unescaper = compat_html_parser.HTMLParser()
         for vid,vtitle in zip(mweb,titles):
             video_id = vid.group('videoID')
             title = vtitle.group('videoName')
@@ -3707,7 +3708,7 @@ class SteamIE(InfoExtractor):
                 'id':video_id,
                 'url':video_url,
                 'ext': 'flv',
-                'title': title
+                'title': unescaper.unescape(title)
             }
             videos.append(info)
         return videos