Merge remote-tracking branch 'sahutd/master'

[youtube-dl] / youtube_dl / extractor / vimeo.py
diff --git a/youtube_dl/extractor/vimeo.py b/youtube_dl/extractor/vimeo.py

index 54b550b0c61d54fd6a34eeb92aa99dd9cf7c8755..a50170ce76923837717dec6df19a558734d46e4e 100644 (file)
--- a/youtube_dl/extractor/vimeo.py
+++ b/youtube_dl/extractor/vimeo.py
@@ -24,7 +24,7 @@ class VimeoIE(InfoExtractor):
  
      # _VALID_URL matches Vimeo URLs
      _VALID_URL = r'''(?x)
-        (?P<proto>https?://)?
+        (?P<proto>(?:https?:)?//)?
          (?:(?:www|(?P<player>player))\.)?
          vimeo(?P<pro>pro)?\.com/
          (?:.*?/)?
@@ -93,7 +93,7 @@ class VimeoIE(InfoExtractor):
          self.report_login()
          login_url = 'https://vimeo.com/log_in'
          webpage = self._download_webpage(login_url, None, False)
-        token = re.search(r'xsrft: \'(.*?)\'', webpage).group(1)
+        token = self._search_regex(r'xsrft: \'(.*?)\'', webpage, 'login token')
          data = compat_urllib_parse.urlencode({'email': username,
                                                'password': password,
                                                'action': 'login',
@@ -109,7 +109,7 @@ class VimeoIE(InfoExtractor):
          password = self._downloader.params.get('videopassword', None)
          if password is None:
              raise ExtractorError('This video is protected by a password, use the --video-password option')
-        token = re.search(r'xsrft: \'(.*?)\'', webpage).group(1)
+        token = self._search_regex(r'xsrft: \'(.*?)\'', webpage, 'login token')
          data = compat_urllib_parse.urlencode({'password': password,
                                                'token': token})
          # I didn't manage to use the password with https
@@ -124,6 +124,19 @@ class VimeoIE(InfoExtractor):
                                 'Verifying the password',
                                 'Wrong password')
  
+    def _verify_player_video_password(self, url, video_id):
+        password = self._downloader.params.get('videopassword', None)
+        if password is None:
+            raise ExtractorError('This video is protected by a password, use the --video-password option')
+        data = compat_urllib_parse.urlencode({'password': password})
+        pass_url = url + '/check-password'
+        password_request = compat_urllib_request.Request(pass_url, data)
+        password_request.add_header('Content-Type', 'application/x-www-form-urlencoded')
+        return self._download_json(
+            password_request, video_id,
+            'Verifying the password',
+            'Wrong password')
+
      def _real_initialize(self):
          self._login()
  
@@ -136,9 +149,6 @@ class VimeoIE(InfoExtractor):
  
          # Extract ID from URL
          mobj = re.match(self._VALID_URL, url)
-        if mobj is None:
-            raise ExtractorError('Invalid URL: %s' % url)
-
          video_id = mobj.group('id')
          if mobj.group('pro') or mobj.group('player'):
              url = 'http://player.vimeo.com/video/' + video_id
@@ -184,8 +194,7 @@ class VimeoIE(InfoExtractor):
                                       cause=e)
          else:
              if config.get('view') == 4:
-                self._verify_video_password(url, video_id, webpage)
-                return self._real_extract(url)
+                config = self._verify_player_video_password(url, video_id)
  
          # Extract title
          video_title = config["video"]["title"]
@@ -282,7 +291,7 @@ class VimeoIE(InfoExtractor):
  
  class VimeoChannelIE(InfoExtractor):
      IE_NAME = 'vimeo:channel'
-    _VALID_URL = r'(?:https?://)?vimeo.\com/channels/(?P<id>[^/]+)'
+    _VALID_URL = r'(?:https?://)?vimeo\.com/channels/(?P<id>[^/]+)'
      _MORE_PAGES_INDICATOR = r'<a.+?rel="next"'
      _TITLE_RE = r'<link rel="alternate"[^>]+?title="(.*?)"'
  
@@ -318,7 +327,7 @@ class VimeoChannelIE(InfoExtractor):
  
  class VimeoUserIE(VimeoChannelIE):
      IE_NAME = 'vimeo:user'
-    _VALID_URL = r'(?:https?://)?vimeo.\com/(?P<name>[^/]+)(?:[#?]|$)'
+    _VALID_URL = r'(?:https?://)?vimeo\.com/(?P<name>[^/]+)(?:/videos|[#?]|$)'
      _TITLE_RE = r'<a[^>]+?class="user">([^<>]+?)</a>'
  
      @classmethod
@@ -335,7 +344,7 @@ class VimeoUserIE(VimeoChannelIE):
  
  class VimeoAlbumIE(VimeoChannelIE):
      IE_NAME = 'vimeo:album'
-    _VALID_URL = r'(?:https?://)?vimeo.\com/album/(?P<id>\d+)'
+    _VALID_URL = r'(?:https?://)?vimeo\.com/album/(?P<id>\d+)'
      _TITLE_RE = r'<header id="page_header">\n\s*<h1>(.*?)</h1>'
  
      def _page_url(self, base_url, pagenum):
@@ -349,7 +358,7 @@ class VimeoAlbumIE(VimeoChannelIE):
  
  class VimeoGroupsIE(VimeoAlbumIE):
      IE_NAME = 'vimeo:group'
-    _VALID_URL = r'(?:https?://)?vimeo.\com/groups/(?P<name>[^/]+)'
+    _VALID_URL = r'(?:https?://)?vimeo\.com/groups/(?P<name>[^/]+)'
  
      def _extract_list_title(self, webpage):
          return self._og_search_title(webpage)
@@ -363,7 +372,7 @@ class VimeoGroupsIE(VimeoAlbumIE):
  class VimeoReviewIE(InfoExtractor):
      IE_NAME = 'vimeo:review'
      IE_DESC = 'Review pages on vimeo'
-    _VALID_URL = r'(?:https?://)?vimeo.\com/[^/]+/review/(?P<id>[^/]+)'
+    _VALID_URL = r'(?:https?://)?vimeo\.com/[^/]+/review/(?P<id>[^/]+)'
      _TEST = {
          'url': 'https://vimeo.com/user21297594/review/75524534/3c257a1b5d',
          'file': '75524534.mp4',