X-Git-Url: http://git.bitcoin.ninja/index.cgi?a=blobdiff_plain;f=youtube_dl%2Fextractor%2Frtbf.py;h=dce64e1517003015722db1097ac83b106cc91136;hb=cc7fec5818254f4679896823c7de9d17f50201ca;hp=544539665567bbb197f6c1132ff971fde4edc66f;hpb=98b7d476d92f7b83c5862395453a4ba47771d890;p=youtube-dl diff --git a/youtube_dl/extractor/rtbf.py b/youtube_dl/extractor/rtbf.py index 544539665..dce64e151 100644 --- a/youtube_dl/extractor/rtbf.py +++ b/youtube_dl/extractor/rtbf.py @@ -5,10 +5,10 @@ import re import json from .common import InfoExtractor -from ..utils import clean_html -class RTBFVideoIE(InfoExtractor): - _VALID_URL = r'https?://www.rtbf.be/video/(?P[^?]+)\?.*id=(?P<id>[0-9]+)' + +class RTBFIE(InfoExtractor): + _VALID_URL = r'https?://www.rtbf.be/video/[^\?]+\?id=(?P<id>\d+)' _TEST = { 'url': 'https://www.rtbf.be/video/detail_les-diables-au-coeur-episode-2?id=1921274', 'md5': '799f334ddf2c0a582ba80c44655be570', @@ -16,7 +16,10 @@ class RTBFVideoIE(InfoExtractor): 'id': '1921274', 'ext': 'mp4', 'title': 'Les Diables au coeur (épisode 2)', + 'description': 'Football - Diables Rouges', 'duration': 3099, + 'timestamp': 1398456336, + 'upload_date': '20140425', } } @@ -24,25 +27,23 @@ class RTBFVideoIE(InfoExtractor): mobj = re.match(self._VALID_URL, url) video_id = mobj.group('id') - # TODO more code goes here, for example ... - webpage = self._download_webpage(url, video_id) - title = self._html_search_regex( - r'<meta property="og:description" content="([^"]*)"', - webpage, 'title', mobj.group('title')) + page = self._download_webpage('https://www.rtbf.be/video/embed?id=%s' % video_id, video_id) + + data = json.loads(self._html_search_regex( + r'<div class="js-player-embed(?: player-embed)?" data-video="([^"]+)"', page, 'data video'))['data'] - iframe_url = self._html_search_regex(r'<iframe [^>]*src="([^"]+)"', - webpage, 'iframe') - iframe = self._download_webpage(iframe_url, video_id) + video_url = data.get('downloadUrl') or data.get('url') - data_video_idx = iframe.find('data-video') - next_data_idx = iframe.find('data-', data_video_idx + 1) - json_data_start = data_video_idx + len('data-video=') + 1 - json_data_end = next_data_idx - 2 - video_data = json.loads(clean_html(iframe[json_data_start:json_data_end])) + if data['provider'].lower() == 'youtube': + return self.url_result(video_url, 'Youtube') return { 'id': video_id, - 'title': title, - 'url': video_data['data']['downloadUrl'], - 'duration': video_data['data']['duration'], + 'url': video_url, + 'title': data['title'], + 'description': data.get('description') or data.get('subtitle'), + 'thumbnail': data['thumbnail']['large'], + 'duration': data.get('duration') or data.get('realDuration'), + 'timestamp': data['created'], + 'view_count': data['viewCount'], }