]> jfr.im git - yt-dlp.git/blame - youtube_dl/extractor/hypem.py
Add support for https for all extractors as preventive and future-proof measure
[yt-dlp.git] / youtube_dl / extractor / hypem.py
CommitLineData
2656f4eb
PH
1from __future__ import unicode_literals
2
27110b05 3import json
27110b05
PH
4import time
5
6from .common import InfoExtractor
5c2266df 7from ..compat import compat_urllib_parse
1cc79574 8from ..utils import (
27110b05 9 ExtractorError,
5c2266df 10 sanitized_Request,
27110b05
PH
11)
12
13
14class HypemIE(InfoExtractor):
5886b38d 15 _VALID_URL = r'https?://(?:www\.)?hypem\.com/track/(?P<id>[^/]+)/'
6f5ac90c 16 _TEST = {
2656f4eb
PH
17 'url': 'http://hypem.com/track/1v6ga/BODYWORK+-+TAME',
18 'md5': 'b9cc91b5af8995e9f0c1cee04c575828',
19 'info_dict': {
20 'id': '1v6ga',
21 'ext': 'mp3',
22 'title': 'Tame',
23 'uploader': 'BODYWORK',
6f5ac90c
PH
24 }
25 }
27110b05
PH
26
27 def _real_extract(self, url):
1cc79574 28 track_id = self._match_id(url)
27110b05 29
a56f9de1 30 data = {'ax': 1, 'ts': time.time()}
960e0388 31 request = sanitized_Request(url + '?' + compat_urllib_parse.urlencode(data))
2656f4eb
PH
32 response, urlh = self._download_webpage_handle(
33 request, track_id, 'Downloading webpage with the url')
27110b05 34
2656f4eb 35 html_tracks = self._html_search_regex(
960e0388 36 r'(?ms)<script type="application/json" id="displayList-data">(.+?)</script>',
2656f4eb 37 response, 'tracks')
27110b05
PH
38 try:
39 track_list = json.loads(html_tracks)
2656f4eb 40 track = track_list['tracks'][0]
27110b05 41 except ValueError:
2656f4eb 42 raise ExtractorError('Hypemachine contained invalid JSON.')
27110b05 43
2656f4eb
PH
44 key = track['key']
45 track_id = track['id']
2656f4eb 46 title = track['song']
27110b05 47
5c2266df 48 request = sanitized_Request(
960e0388
S
49 'http://hypem.com/serve/source/%s/%s' % (track_id, key),
50 '', {'Content-Type': 'application/json'})
2656f4eb 51 song_data = self._download_json(request, track_id, 'Downloading metadata')
960e0388
S
52 final_url = song_data['url']
53 artist = track.get('artist')
27110b05 54
2656f4eb
PH
55 return {
56 'id': track_id,
57 'url': final_url,
58 'ext': 'mp3',
59 'title': title,
60 'uploader': artist,
61 }