Merge remote-tracking branch 'Rudloff/websurg'
[youtube-dl] / youtube_dl / extractor / websurg.py
1 # coding: utf-8
2
3 import re
4
5 from ..utils import (
6     compat_urllib_request,
7     compat_urllib_parse
8 )
9
10 from .common import InfoExtractor
11
class WeBSurgIE(InfoExtractor):
    """Information extractor for videos on websurg.com media pages.

    A login is attempted during initialisation with the ``username`` and
    ``password`` entries of the downloader parameters.
    """

    IE_NAME = u'websurg.com'
    # The single capture group is used as the video id by _real_extract().
    _VALID_URL = r'http://.*?\.websurg\.com/MEDIA/\?noheader=1&doi=(.*)'

    _TEST = {
        u'url': u'http://www.websurg.com/MEDIA/?noheader=1&doi=vd01en4012',
        u'file': u'vd01en4012.mp4',
        u'params': {
            u'skip_download': True,
        }
    }

    _LOGIN_URL = 'http://www.websurg.com/inc/login/login_div.ajax.php?login=1'

    def _real_initialize(self):
        """Log in to the site with the credentials from the downloader params.

        The login form is POSTed to ``_LOGIN_URL``; the same URL is then
        downloaded again and its body is compared against ``'OK'``.  Any other
        body is reported through the downloader as a login failure.

        Raises:
            KeyError: if ``username`` or ``password`` is absent from the
                downloader params.
        """
        login_form = {
            'username': self._downloader.params['username'],
            'password': self._downloader.params['password'],
            'Submit': 1
        }

        # urlencode() returns text, but Python 3 only accepts bytes as the
        # request body; the encoded form is plain ASCII, so this is a no-op
        # on Python 2.
        post_data = compat_urllib_parse.urlencode(login_form).encode('utf-8')
        request = compat_urllib_request.Request(self._LOGIN_URL, post_data)
        request.add_header(
            'Content-Type', 'application/x-www-form-urlencoded;charset=utf-8')

        # The response body of the POST is not used; close the response
        # explicitly instead of leaving the connection to the garbage
        # collector.
        # NOTE(review): presumably the POST sets a session cookie that the
        # follow-up request below relies on -- confirm against the opener
        # configuration.
        response = compat_urllib_request.urlopen(request)
        response.close()

        webpage = self._download_webpage(self._LOGIN_URL, '', 'Logging in')

        if webpage != 'OK':
            self._downloader.report_error(
                u'Unable to log in: bad username/password')

    def _real_extract(self, url):
        """Extract the metadata and stream location of the video at *url*.

        Returns:
            A dict with the keys ``id``, ``title``, ``description``, ``ext``,
            ``url`` and ``thumbnail``.  ``url`` is the page's ``streamer``
            attribute joined to its ``src`` attribute with a ``/``.

        Raises:
            RuntimeError: if the page contains no ``streamer``/``src``
                attribute pair to build the video URL from.
        """
        video_id = re.match(self._VALID_URL, url).group(1)

        webpage = self._download_webpage(url, video_id)

        url_info = re.search(r'streamer="(.*?)" src="(.*?)"', webpage)
        if url_info is None:
            # Fail with a clear message rather than an AttributeError on
            # ``None.group`` when the player markup is missing.
            raise RuntimeError(
                u'Unable to find the video stream URL for %s' % video_id)
        streamer, src = url_info.groups()

        return {
            'id': video_id,
            'title': self._og_search_title(webpage),
            'description': self._og_search_description(webpage),
            'ext': 'mp4',
            'url': streamer + '/' + src,
            'thumbnail': self._og_search_thumbnail(webpage),
        }