]> jfr.im git - yt-dlp.git/blame - youtube_dl/extractor/hypem.py
[southpark:de] Add test for non-ASCII in URLs
[yt-dlp.git] / youtube_dl / extractor / hypem.py
CommitLineData
2656f4eb
PH
1from __future__ import unicode_literals
2
27110b05 3import json
27110b05
PH
4import time
5
6from .common import InfoExtractor
1cc79574 7from ..compat import (
27110b05
PH
8 compat_urllib_parse,
9 compat_urllib_request,
1cc79574
PH
10)
11from ..utils import (
27110b05
PH
12 ExtractorError,
13)
14
15
class HypemIE(InfoExtractor):
    """Extractor for single-track pages on hypem.com."""

    _VALID_URL = r'http://(?:www\.)?hypem\.com/track/(?P<id>[^/]+)/'
    _TEST = {
        'url': 'http://hypem.com/track/1v6ga/BODYWORK+-+TAME',
        'md5': 'b9cc91b5af8995e9f0c1cee04c575828',
        'info_dict': {
            'id': '1v6ga',
            'ext': 'mp3',
            'title': 'Tame',
            'uploader': 'BODYWORK',
        }
    }

    def _real_extract(self, url):
        """Resolve a track page URL to a downloadable mp3 info dict.

        Downloads the track page, reads the JSON embedded in its
        ``displayList-data`` script tag, then asks the ``serve/source``
        endpoint for the final media URL.

        Returns a dict with ``id``, ``url``, ``ext``, ``title`` and
        ``uploader`` keys.

        Raises ExtractorError if the embedded JSON cannot be parsed or does
        not contain at least one track.
        """
        track_id = self._match_id(url)

        # The page is requested with 'ax' and a timestamp as query arguments.
        data = {'ax': 1, 'ts': time.time()}
        data_encoded = compat_urllib_parse.urlencode(data)
        # Append with '&' when the matched URL already carries a query string.
        separator = '&' if '?' in url else '?'
        complete_url = url + separator + data_encoded
        request = compat_urllib_request.Request(complete_url)
        response, urlh = self._download_webpage_handle(
            request, track_id, 'Downloading webpage with the url')
        # The Set-Cookie value from this response is replayed on the
        # metadata request below.
        cookie = urlh.headers.get('Set-Cookie', '')

        html_tracks = self._html_search_regex(
            r'(?ms)<script type="application/json" id="displayList-data">\s*(.*?)\s*</script>',
            response, 'tracks')
        try:
            track_list = json.loads(html_tracks)
            track = track_list['tracks'][0]
        except (ValueError, KeyError, IndexError, TypeError):
            # Besides unparsable JSON, also cover a payload that parses but
            # has no usable 'tracks' list, so callers always see
            # ExtractorError instead of a raw lookup error.
            raise ExtractorError('Hypemachine contained invalid JSON.')

        key = track['key']
        track_id = track['id']
        artist = track['artist']
        title = track['song']

        serve_url = "http://hypem.com/serve/source/%s/%s" % (track_id, key)
        # An empty *bytes* body keeps this a POST request; a text string body
        # is rejected by Python 3's urllib.
        request = compat_urllib_request.Request(
            serve_url, b'', {'Content-Type': 'application/json'})
        request.add_header('cookie', cookie)
        song_data = self._download_json(request, track_id, 'Downloading metadata')
        final_url = song_data["url"]

        return {
            'id': track_id,
            'url': final_url,
            'ext': 'mp3',
            'title': title,
            'uploader': artist,
        }