X-Git-Url: http://git.bitcoin.ninja/index.cgi?a=blobdiff_plain;f=youtube_dl%2Fextractor%2Fmit.py;h=d7ab6a9aef23235d099175c7aff76ddd0ac0f84d;hb=cd5b4b0bc2876e16656d33156754ce3c05aa1619;hp=f50e36cb4fcc82a45d3a5f379beadb2764e2faf9;hpb=13ef5648c4498a58c1994719742ad1dd7e5c1b3d;p=youtube-dl diff --git a/youtube_dl/extractor/mit.py b/youtube_dl/extractor/mit.py index f50e36cb4..d7ab6a9ae 100644 --- a/youtube_dl/extractor/mit.py +++ b/youtube_dl/extractor/mit.py @@ -4,16 +4,17 @@ import re import json from .common import InfoExtractor +from .youtube import YoutubeIE from ..utils import ( - compat_urlparse, clean_html, + ExtractorError, get_element_by_id, ) class TechTVMITIE(InfoExtractor): IE_NAME = 'techtv.mit.edu' - _VALID_URL = r'https?://techtv\.mit\.edu/(videos|embeds)/(?P<id>\d+)' + _VALID_URL = r'https?://techtv\.mit\.edu/(?:videos|embeds)/(?P<id>\d+)' _TEST = { 'url': 'http://techtv.mit.edu/videos/25418-mit-dna-learning-center-set', @@ -27,8 +28,7 @@ class TechTVMITIE(InfoExtractor): } def _real_extract(self, url): - mobj = re.match(self._VALID_URL, url) - video_id = mobj.group('id') + video_id = self._match_id(url) raw_page = self._download_webpage( 'http://techtv.mit.edu/videos/%s' % video_id, video_id) clean_page = re.compile(r'', re.S).sub('', raw_page) @@ -71,7 +71,6 @@ class MITIE(TechTVMITIE): _TEST = { 'url': 'http://video.mit.edu/watch/the-government-is-profiling-you-13222/', - 'file': '.mp4', 'md5': '7db01d5ccc1895fc5010e9c9e13648da', 'info_dict': { 'id': '21783', @@ -88,3 +87,70 @@ class MITIE(TechTVMITIE): embed_url = self._search_regex( r'