[youtube] fix hd720 format position
[youtube-dl] / youtube_dl / extractor / funk.py
1 # coding: utf-8
from __future__ import unicode_literals

import re

from .common import InfoExtractor
from .nexx import NexxIE
from ..utils import (
    ExtractorError,
    int_or_none,
    try_get,
)
12
13
class FunkBaseIE(InfoExtractor):
    """Shared base for the funk.net extractors in this module."""

    def _make_url_result(self, video):
        """Turn a funk video metadata dict into a ``url_transparent`` result.

        The result points at a ``nexx:741:<sourceId>`` URL handled by NexxIE.
        ``video`` must contain ``sourceId``; every other field is optional
        and is looked up with ``dict.get``.
        """
        source_id = video['sourceId']

        result = {
            '_type': 'url_transparent',
            'url': 'nexx:741:%s' % source_id,
            'ie_key': NexxIE.ie_key(),
            'id': source_id,
            'title': video.get('title'),
            'description': video.get('description'),
        }

        # Numeric fields go through int_or_none before being stored.
        numeric_fields = (
            ('duration', 'duration'),
            ('season_number', 'seasonNr'),
            ('episode_number', 'episodeNr'),
        )
        for result_key, video_key in numeric_fields:
            result[result_key] = int_or_none(video.get(video_key))

        return result
27
28
class FunkMixIE(FunkBaseIE):
    """Extractor for funk.net ``/mix/<id>/<alias>`` URLs."""

    _VALID_URL = r'https?://(?:www\.)?funk\.net/mix/(?P<id>[^/]+)/(?P<alias>[^/?#&]+)'
    _TESTS = [{
        'url': 'https://www.funk.net/mix/59d65d935f8b160001828b5b/die-realste-kifferdoku-aller-zeiten',
        'md5': '8edf617c2f2b7c9847dfda313f199009',
        'info_dict': {
            'id': '123748',
            'ext': 'mp4',
            'title': '"Die realste Kifferdoku aller Zeiten"',
            'description': 'md5:c97160f5bafa8d47ec8e2e461012aa9d',
            'timestamp': 1490274721,
            'upload_date': '20170323',
        },
    }]

    def _real_extract(self, url):
        """Resolve a mix URL to the video it refers to.

        Downloads the curated lists, picks the list whose ``entityId`` or
        ``alias`` equals the id from the URL, then picks the entry of that
        list whose ``alias`` equals the alias from the URL.

        Raises ExtractorError when no list or no entry matches, instead of
        letting a bare StopIteration escape from ``next()``.
        """
        mobj = re.match(self._VALID_URL, url)
        mix_id = mobj.group('id')
        alias = mobj.group('alias')

        lists = self._download_json(
            'https://www.funk.net/api/v3.1/curation/curatedLists/',
            mix_id, headers={
                'authorization': 'eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9.eyJjbGllbnROYW1lIjoiY3VyYXRpb24tdG9vbC12Mi4wIiwic2NvcGUiOiJzdGF0aWMtY29udGVudC1hcGksY3VyYXRpb24tc2VydmljZSxzZWFyY2gtYXBpIn0.SGCC1IXHLtZYoo8PvRKlU2gXH1su8YSu47sB3S4iXBI',
                'Referer': url,
            }, query={
                'size': 100,
            })['result']['lists']

        # The id part of the URL is compared against both the list's
        # entityId and its alias.
        curated_list = next(
            (item for item in lists
             if mix_id in (item.get('entityId'), item.get('alias'))),
            None)
        if curated_list is None:
            raise ExtractorError('Unable to find mix %s' % mix_id)

        video = next(
            (meta['videoDataDelegate']
             for meta in curated_list['videoMetas']
             if meta.get('alias') == alias),
            None)
        if video is None:
            raise ExtractorError(
                'Unable to find video %s in mix %s' % (alias, mix_id))

        return self._make_url_result(video)
66
67
class FunkChannelIE(FunkBaseIE):
    """Extractor for funk.net ``/channel/<id>/<alias>`` URLs."""

    _VALID_URL = r'https?://(?:www\.)?funk\.net/channel/(?P<id>[^/]+)/(?P<alias>[^/?#&]+)'
    _TESTS = [{
        'url': 'https://www.funk.net/channel/ba/die-lustigsten-instrumente-aus-dem-internet-teil-2',
        'info_dict': {
            'id': '1155821',
            'ext': 'mp4',
            'title': 'Die LUSTIGSTEN INSTRUMENTE aus dem Internet - Teil 2',
            'description': 'md5:a691d0413ef4835588c5b03ded670c1f',
            'timestamp': 1514507395,
            'upload_date': '20171229',
        },
        'params': {
            'skip_download': True,
        },
    }, {
        # only available via byIdList API
        'url': 'https://www.funk.net/channel/informr/martin-sonneborn-erklaert-die-eu',
        'info_dict': {
            'id': '205067',
            'ext': 'mp4',
            'title': 'Martin Sonneborn erklärt die EU',
            'description': 'md5:050f74626e4ed87edf4626d2024210c0',
            'timestamp': 1494424042,
            'upload_date': '20170510',
        },
        'params': {
            'skip_download': True,
        },
    }, {
        'url': 'https://www.funk.net/channel/59d5149841dca100012511e3/mein-erster-job-lovemilla-folge-1/lovemilla/',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Resolve a channel video URL to the video it refers to.

        The byIdList endpoint is queried first with the alias from the URL;
        that request is non-fatal. If it yields no usable video, the
        channel's filter listing is downloaded and searched for an entry
        whose ``alias`` matches.

        Raises ExtractorError when neither lookup yields a video, instead of
        letting a bare StopIteration escape from ``next()``.
        """
        mobj = re.match(self._VALID_URL, url)
        channel_id = mobj.group('id')
        alias = mobj.group('alias')

        headers = {
            'authorization': 'eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9.eyJjbGllbnROYW1lIjoiY3VyYXRpb24tdG9vbCIsInNjb3BlIjoic3RhdGljLWNvbnRlbnQtYXBpLGN1cmF0aW9uLWFwaSxzZWFyY2gtYXBpIn0.q4Y2xZG8PFHai24-4Pjx2gym9RmJejtmK6lMXP5wAgc',
            'Referer': url,
        }

        video = None

        # First attempt: direct lookup by alias. fatal=False lets extraction
        # continue with the fallback below when this request fails.
        by_id_list = self._download_json(
            'https://www.funk.net/api/v3.0/content/videos/byIdList', channel_id,
            headers=headers, query={
                'ids': alias,
            }, fatal=False)
        if by_id_list:
            video = try_get(by_id_list, lambda x: x['result'][0], dict)

        if not video:
            # Fallback: search the channel's listing for the alias.
            results = self._download_json(
                'https://www.funk.net/api/v3.0/content/videos/filter', channel_id,
                headers=headers, query={
                    'channelId': channel_id,
                    'size': 100,
                })['result']
            video = next(
                (entry for entry in results if entry.get('alias') == alias),
                None)
            if video is None:
                raise ExtractorError(
                    'Unable to find video %s in channel %s'
                    % (alias, channel_id))

        return self._make_url_result(video)