Allow downloading videos with other characters in their titles
author: Jaime Marquínez Ferrándiz <jaimemf93@gmail.com>
Thu, 3 Jan 2013 20:05:04 +0000 (21:05 +0100)
committer: Jaime Marquínez Ferrándiz <jaimemf93@gmail.com>
Thu, 3 Jan 2013 20:17:35 +0000 (21:17 +0100)
Especially HTML entities

youtube_dl/InfoExtractors.py

index d040eec8286d22bea075e2ba95d84f2c6dc24775..f72defdf278afd1a3b1c3fa4ed7673cd4f5316c7 100755 (executable)
@@ -3694,9 +3694,10 @@ class SteamIE(InfoExtractor):
         videourl = 'http://store.steampowered.com/video/%s/' % gameID
         webpage = self._download_webpage(videourl, gameID)
         mweb = re.finditer(urlRE, webpage)
-        namesRE = r'<span class=\"title\">(?P<videoName>[\w:/\.\?=\+\s-]+)</span>'
+        namesRE = r'<span class="title">(?P<videoName>.+)</span>'
         titles = list(re.finditer(namesRE, webpage))
         videos = []
+        unescaper = compat_html_parser.HTMLParser()
         for vid,vtitle in zip(mweb,titles):
             video_id = vid.group('videoID')
             title = vtitle.group('videoName')
@@ -3707,7 +3708,7 @@ class SteamIE(InfoExtractor):
                 'id':video_id,
                 'url':video_url,
                 'ext': 'flv',
-                'title': title
+                'title': unescaper.unescape(title)
                   }
             videos.append(info)
         return videos