[hypem] Modernize
[youtube-dl] / youtube_dl / extractor / hypem.py
1 from __future__ import unicode_literals
2
3 import json
4 import re
5 import time
6
7 from .common import InfoExtractor
8 from ..utils import (
9     compat_str,
10     compat_urllib_parse,
11     compat_urllib_request,
12
13     ExtractorError,
14 )
15
16
class HypemIE(InfoExtractor):
    """Information extractor for single track pages on hypem.com.

    Handles URLs of the form ``http://hypem.com/track/<id>/<slug>``; the
    first capture group of ``_VALID_URL`` is used as the initial track id.
    """

    _VALID_URL = r'http://(?:www\.)?hypem\.com/track/([^/]+)/([^/]+)'
    _TEST = {
        'url': 'http://hypem.com/track/1v6ga/BODYWORK+-+TAME',
        'md5': 'b9cc91b5af8995e9f0c1cee04c575828',
        'info_dict': {
            'id': '1v6ga',
            'ext': 'mp3',
            'title': 'Tame',
            'uploader': 'BODYWORK',
        }
    }

    def _real_extract(self, url):
        """Resolve a track page URL to a downloadable mp3.

        The track page is fetched with ``ax`` and ``ts`` query parameters,
        the JSON embedded in its ``displayList-data`` script tag is parsed,
        and the first listed track's id/key pair is used to query the
        ``/serve/source/`` endpoint for the final media URL.

        Returns a dict with ``id``, ``url``, ``ext``, ``title`` and
        ``uploader`` (``None`` when the track has no ``artist`` entry).

        Raises ExtractorError if the embedded JSON cannot be parsed or does
        not contain at least one track.
        """
        mobj = re.match(self._VALID_URL, url)
        track_id = mobj.group(1)

        # Fetch the track page with the 'ax' flag and the current timestamp
        # appended as query parameters.
        query = compat_urllib_parse.urlencode({'ax': 1, 'ts': time.time()})
        request = compat_urllib_request.Request(url + '?' + query)
        response, urlh = self._download_webpage_handle(
            request, track_id, 'Downloading webpage with the url')
        # The cookie set by this response is replayed on the serve request
        # further down.
        cookie = urlh.headers.get('Set-Cookie', '')

        html_tracks = self._html_search_regex(
            r'(?ms)<script type="application/json" id="displayList-data">\s*(.*?)\s*</script>',
            response, 'tracks')
        try:
            track_list = json.loads(html_tracks)
        except ValueError:
            raise ExtractorError('Hypemachine contained invalid JSON.')

        # Well-formed JSON can still lack a usable track entry; report that
        # as an extraction failure instead of leaking a raw lookup error.
        try:
            track = track_list['tracks'][0]
        except (KeyError, IndexError, TypeError):
            raise ExtractorError('Hypemachine track list is missing or empty.')

        key = track['key']
        # From here on the id reported by the site replaces the one taken
        # from the URL.
        track_id = track['id']
        title = track['song']
        # 'uploader' is only descriptive metadata, so a missing artist must
        # not abort the extraction.
        artist = track.get('artist')

        serve_url = 'http://hypem.com/serve/source/%s/%s' % (track_id, key)
        # An (empty) data argument is passed on purpose, exactly as before;
        # with urllib a non-None data argument turns the request into a POST.
        request = compat_urllib_request.Request(
            serve_url, '', {'Content-Type': 'application/json'})
        request.add_header('cookie', cookie)
        song_data = self._download_json(
            request, track_id, 'Downloading metadata')

        return {
            'id': track_id,
            'url': song_data['url'],
            'ext': 'mp3',
            'title': title,
            'uploader': artist,
        }