Merge remote-tracking branch 'Dineshs91/f4m-2.0'
[youtube-dl] / youtube_dl / extractor / screencastomatic.py
1 # coding: utf-8
2 from __future__ import unicode_literals
3
4 from .common import InfoExtractor
5 from ..compat import compat_urlparse
6 from ..utils import (
7     ExtractorError,
8     js_to_json,
9 )
10
11
class ScreencastOMaticIE(InfoExtractor):
    """Extractor for screencast-o-matic.com watch pages.

    The video location is read from the ``jwplayer('mp4Player').setup({...})``
    call embedded in the watch page; the entry of its ``modes`` list whose
    ``type`` is ``html5`` supplies the media file.
    """

    _VALID_URL = r'https?://screencast-o-matic\.com/watch/(?P<id>[0-9a-zA-Z]+)'
    _TEST = {
        'url': 'http://screencast-o-matic.com/watch/c2lD3BeOPl',
        'md5': '483583cb80d92588f15ccbedd90f0c18',
        'info_dict': {
            'id': 'c2lD3BeOPl',
            'ext': 'mp4',
            'title': 'Welcome to 3-4 Philosophy @ DECV!',
            # Raw string: '\.' is not a valid escape in a normal literal.
            'thumbnail': r're:^https?://.*\.jpg$',
            'description': 'as the title says! also: some general info re 1) VCE philosophy and 2) distance learning.',
        }
    }

    def _real_extract(self, url):
        """Build the info dict for the watch page at *url*.

        Raises:
            ExtractorError: if the player setup contains no ``html5`` mode.
        """
        video_id = self._match_id(url)
        webpage = self._download_webpage(url, video_id)

        # The player configuration is a JavaScript object literal, so it is
        # converted with js_to_json before being parsed.
        setup_js = self._search_regex(
            r"(?s)jwplayer\('mp4Player'\)\.setup\((\{.*?\})\);",
            webpage, 'setup code')
        data = self._parse_json(setup_js, video_id, transform_source=js_to_json)

        # A missing or empty 'modes' list is reported the same way as a list
        # without an html5 entry, rather than surfacing as a bare KeyError.
        video_data = next(
            (m for m in data.get('modes') or [] if m.get('type') == 'html5'),
            None)
        if video_data is None:
            raise ExtractorError('Could not find any video entries!')

        # The configured file may be a relative reference; resolve it against
        # the page URL.
        video_url = compat_urlparse.urljoin(url, video_data['config']['file'])
        thumbnail = data.get('image')

        return {
            'id': video_id,
            'title': self._og_search_title(webpage),
            'description': self._og_search_description(webpage),
            'url': video_url,
            'ext': 'mp4',
            'thumbnail': thumbnail,
        }