X-Git-Url: http://git.bitcoin.ninja/index.cgi?a=blobdiff_plain;f=youtube_dl%2Fextractor%2Fkeek.py;h=94a03d277a227733480b8a73f5535f9f3410be15;hb=2f483bc1c389709623117079439708783122b5ec;hp=5d679e88d811c6ad55c9fe475267c2842a641f83;hpb=5aaca50d60cf2dfbc548dd14dc0289dcd0a4d89b;p=youtube-dl diff --git a/youtube_dl/extractor/keek.py b/youtube_dl/extractor/keek.py index 5d679e88d..94a03d277 100644 --- a/youtube_dl/extractor/keek.py +++ b/youtube_dl/extractor/keek.py @@ -1,40 +1,39 @@ +# coding: utf-8 from __future__ import unicode_literals -import re - from .common import InfoExtractor class KeekIE(InfoExtractor): - _VALID_URL = r'https?://(?:www\.)?keek\.com/(?:!|\w+/keeks/)(?P<videoID>\w+)' + _VALID_URL = r'https?://(?:www\.)?keek\.com/keek/(?P<id>\w+)' IE_NAME = 'keek' _TEST = { - 'url': 'https://www.keek.com/ytdl/keeks/NODfbab', - 'file': 'NODfbab.mp4', + 'url': 'https://www.keek.com/keek/NODfbab', 'md5': '9b0636f8c0f7614afa4ea5e4c6e57e83', 'info_dict': { + 'id': 'NODfbab', + 'ext': 'mp4', + 'title': 'md5:35d42050a3ece241d5ddd7fdcc6fd896', 'uploader': 'ytdl', - 'title': 'test chars: "\'/\\\u00e4<>This is a test video for youtube-dl.For more information, contact phihag@phihag.de .', + 'uploader_id': 'eGT5bab', }, } def _real_extract(self, url): - m = re.match(self._VALID_URL, url) - video_id = m.group('videoID') + video_id = self._match_id(url) - video_url = 'http://cdn.keek.com/keek/video/%s' % video_id - thumbnail = 'http://cdn.keek.com/keek/thumbnail/%s/w100/h75' % video_id webpage = self._download_webpage(url, video_id) - uploader = self._html_search_regex( - r'
[\S\s]+?

(?P.+?)

', - webpage, 'uploader', fatal=False) - return { 'id': video_id, - 'url': video_url, + 'url': self._og_search_video_url(webpage), 'ext': 'mp4', - 'title': self._og_search_title(webpage), - 'thumbnail': thumbnail, - 'uploader': uploader + 'title': self._og_search_description(webpage).strip(), + 'thumbnail': self._og_search_thumbnail(webpage), + 'uploader': self._search_regex( + r'data-username=(["\'])(?P<uploader>.+?)\1', webpage, + 'uploader', fatal=False, group='uploader'), + 'uploader_id': self._search_regex( + r'data-user-id=(["\'])(?P<uploader_id>.+?)\1', webpage, + 'uploader id', fatal=False, group='uploader_id'), }