Merge branch 'vimeo' of ssh://github.com/rbrito/youtube-dl into vimeo
[youtube-dl] / youtube-dl
index 5a68a2ee9a169039b4ced962d12b5511af7844d7..782372688918ba638206e8a755e849f1ee7527bd 100755 (executable)
@@ -1724,7 +1724,7 @@ class VimeoIE(InfoExtractor):
        """Information extractor for vimeo.com."""
 
        # _VALID_URL matches Vimeo URLs
-       _VALID_URL = r'(?:http://)?vimeo\.com/([0-9]+)'
+       _VALID_URL = r'(?:http://)?(?:(?:www|player).)?vimeo\.com/(?:video/)?([0-9]+)'
 
        def __init__(self, downloader=None):
                InfoExtractor.__init__(self, downloader)
@@ -1765,8 +1765,12 @@ class VimeoIE(InfoExtractor):
                        self._downloader.trouble(u'ERROR: Unable to retrieve video webpage: %s' % str(err))
                        return
 
-               # Extract uploader and title from webpage
+               # Now we begin extracting as much information as we can from what we
+               # retrieved. First we extract the information common to all extractors,
+               # and later we extract those that are Vimeo specific.
                self.report_extraction(video_id)
+
+               # Extract title
                mobj = re.search(r'<caption>(.*?)</caption>', webpage)
                if mobj is None:
                        self._downloader.trouble(u'ERROR: unable to extract video title')
@@ -1774,6 +1778,7 @@ class VimeoIE(InfoExtractor):
                video_title = mobj.group(1).decode('utf-8')
                simple_title = re.sub(ur'(?u)([^%s]+)' % simple_title_chars, ur'_', video_title)
 
+               # Extract uploader
                mobj = re.search(r'<uploader_url>http://vimeo.com/(.*?)</uploader_url>', webpage)
                if mobj is None:
                        self._downloader.trouble(u'ERROR: unable to extract video uploader')
@@ -1796,14 +1801,14 @@ class VimeoIE(InfoExtractor):
                # if not video_description: video_description = 'No description available.'
                video_description = 'Foo.'
 
-               # Extract request signature
+               # Vimeo specific: extract request signature
                mobj = re.search(r'<request_signature>(.*?)</request_signature>', webpage)
                if mobj is None:
                        self._downloader.trouble(u'ERROR: unable to extract request signature')
                        return
                sig = mobj.group(1).decode('utf-8')
 
-               # Extract request signature expiration
+               # Vimeo specific: extract request signature expiration
                mobj = re.search(r'<request_signature_expires>(.*?)</request_signature_expires>', webpage)
                if mobj is None:
                        self._downloader.trouble(u'ERROR: unable to extract request signature expiration')