SteamIE
author: Jaime Marquínez Ferrándiz <jaimemf93@gmail.com>
Tue, 1 Jan 2013 13:12:14 +0000 (14:12 +0100)
committer: Jaime Marquínez Ferrándiz <jaimemf93@gmail.com>
Tue, 1 Jan 2013 13:12:14 +0000 (14:12 +0100)
youtube_dl/InfoExtractors.py
youtube_dl/__init__.py

index d74751a55b3f3754656ea302f724e0d01f6a0873..d7295ae3fe0bafb87dd3a1ea88e431ffd31cd32f 100755 (executable)
@@ -3756,3 +3756,52 @@ class TweetReelIE(InfoExtractor):
             'upload_date': upload_date
         }
         return [info]
+        
+class SteamIE(InfoExtractor):
+    """Information extractor for the movies listed on a store.steampowered.com game page."""
+    _VALID_URL = r"""http://store\.steampowered\.com/
+                (?P<urltype>video|app)/ #If the page is only for videos or for a game
+                (?P<gameID>\d+)/?
+                (?P<videoID>\d*)(?P<extra>\??) #For urltype == video we sometimes get the videoID
+                """
+    IE_NAME = u'Steam'
+
+    def suitable(self, url):
+        """Receives a URL and returns True if suitable for this IE."""
+        # _VALID_URL is written in verbose syntax, so re.VERBOSE is required.
+        return re.match(self._VALID_URL, url, re.VERBOSE) is not None
+
+    def report_download_video_page(self, game_id):
+        """Report that the video page of game_id is being downloaded."""
+        self._downloader.to_screen(u'[%s] %s: Downloading video page' % (self.IE_NAME, game_id))
+
+    def _real_extract(self, url):
+        """Return a list of info dicts, one per movie found on the game's video page."""
+        m = re.match(self._VALID_URL, url, re.VERBOSE)
+        # Matches the 'movie_<id>': { FILENAME: "...", MOVIE_NAME: "..." } entries of the page.
+        urlRE = r"'movie_(?P<videoID>\d+)': \{\s*FILENAME: \"(?P<videoURL>[\w:/\.\?=]+)\"(,\s*MOVIE_NAME: \"(?P<videoName>[\w:/\.\?=\+-]+)\")?\s*\},"
+        gameID = m.group('gameID')
+        # Always fetch the /video/<gameID>/ page, whatever urltype was given.
+        videourl = 'http://store.steampowered.com/video/%s/' % gameID
+        try:
+            self.report_download_video_page(gameID)
+            urlh = compat_urllib_request.urlopen(videourl)
+            webpage = urlh.read().decode('utf-8', 'ignore')
+        except (compat_urllib_error.URLError, compat_http_client.HTTPException, socket.error) as err:
+            self._downloader.trouble(u'ERROR: unable to download webpage: %s' % compat_str(err))
+            return
+        namesRE = r'<span class=\"title\">(?P<videoName>[\w:/\.\?=\+\s-]+)</span>'
+        titles = [t.group('videoName') for t in re.finditer(namesRE, webpage)]
+        videos = []
+        for i, vid in enumerate(re.finditer(urlRE, webpage)):
+            video_id = vid.group('videoID')
+            # The page may list fewer titles than movies; fall back to the
+            # inline MOVIE_NAME, then the id, instead of raising IndexError.
+            title = titles[i] if i < len(titles) else (vid.group('videoName') or video_id)
+            videos.append({
+                'id': video_id,
+                'url': vid.group('videoURL'),
+                'ext': 'flv',
+                'title': title,
+            })
+        return videos
index 8068810ca19390b3f2e4ebc8bf54cb6fc9337165..62ecdf6b6c97b766ed320488bcdf208307102be1 100644 (file)
@@ -313,6 +313,7 @@ def gen_extractors():
         JustinTVIE(),
         FunnyOrDieIE(),
         TweetReelIE(),
+        SteamIE(),
         GenericIE()
     ]