]> jfr.im git - yt-dlp.git/blame - youtube_dl/extractor/vgtv.py
[lrt] Add new extractor
[yt-dlp.git] / youtube_dl / extractor / vgtv.py
CommitLineData
78149a96
MK
1# coding: utf-8
2from __future__ import unicode_literals
3
4import re
5
6from .common import InfoExtractor
321c1e44 7from ..utils import float_or_none
78149a96 8
78149a96
MK
9
class VGTVIE(InfoExtractor):
    """Information extractor for vgtv.no video and live pages.

    The numeric asset id is taken from the page URL and the asset
    description is fetched as JSON from the svp.vg.no API.  Formats are
    collected from the HLS, HDS and progressive MP4 entries of the asset's
    ``streamUrls`` mapping.
    """

    _VALID_URL = r'http://(?:www\.)?vgtv\.no/#!/(?:.*)/(?P<id>[0-9]+)'
    _TESTS = [
        {
            # streamType: vod
            'url': 'http://www.vgtv.no/#!/video/84196/hevnen-er-soet-episode-10-abu',
            'md5': 'b8be7a234cebb840c0d512c78013e02f',
            'info_dict': {
                'id': '84196',
                'ext': 'mp4',
                'title': 'Hevnen er søt episode 10: Abu',
                'description': 'md5:e25e4badb5f544b04341e14abdc72234',
                'thumbnail': r're:^https?://.*\.jpg',
                'duration': 648.000,
                'timestamp': 1404626400,
                'upload_date': '20140706',
                'view_count': int,
            },
        },
        {
            # streamType: wasLive
            'url': 'http://www.vgtv.no/#!/live/100764/opptak-vgtv-foelger-em-kvalifiseringen',
            'info_dict': {
                'id': '100764',
                'ext': 'mp4',
                'title': 'OPPTAK: VGTV følger EM-kvalifiseringen',
                'description': 'md5:3772d9c0dc2dff92a886b60039a7d4d3',
                'thumbnail': r're:^https?://.*\.jpg',
                'duration': 9056.000,
                'timestamp': 1410113864,
                'upload_date': '20140907',
                'view_count': int,
            },
            'params': {
                # m3u8 download
                'skip_download': True,
            },
        },
        {
            # streamType: live
            'url': 'http://www.vgtv.no/#!/live/100015/direkte-her-kan-du-se-laksen-live-fra-suldalslaagen',
            'info_dict': {
                'id': '100015',
                'ext': 'mp4',
                'title': 'DIREKTE: Her kan du se laksen live fra Suldalslågen!',
                'description': 'md5:9a60cc23fa349f761628924e56eeec2d',
                'thumbnail': r're:^https?://.*\.jpg',
                'duration': 0,
                'timestamp': 1407423348,
                'upload_date': '20140807',
                'view_count': int,
            },
            'params': {
                # m3u8 download
                'skip_download': True,
            },
        },
    ]

    # "<width>_<height>_<bitrate>" token embedded in rendition file names.
    _MP4_VARIANT_RE = r'(?P<width>\d+)_(?P<height>\d+)_(?P<vbr>\d+)'

    def _extract_mp4_formats(self, mp4_url, manifest_url):
        """Build progressive MP4 format dicts.

        mp4_url      -- URL of the progressive MP4 stream; its directory
                        part and file extension are reused for every
                        rendition.
        manifest_url -- HLS or HDS manifest URL, or None.  It is split on
                        commas and every piece that contains a
                        width_height_bitrate token is treated as a
                        rendition file name.

        Returns a list of format dicts.  When no rendition can be derived
        from the manifest URL (including when there is no manifest URL at
        all) the list holds a single entry pointing at mp4_url itself.
        """
        formats = []

        if manifest_url:
            base_url = mp4_url.rpartition('/')[0]
            extension = mp4_url.rpartition('.')[-1]
            for variant in manifest_url.split(','):
                mobj = re.search(self._MP4_VARIANT_RE, variant)
                if not mobj:
                    continue
                vbr = int(mobj.group('vbr'))
                formats.append({
                    # Built in a single formatting pass so that a literal
                    # '%' inside the base URL cannot be misread as a
                    # conversion specifier.
                    'url': '%s/%s.%s' % (base_url, variant, extension),
                    'format_id': 'mp4-%s' % vbr,
                    'width': int(mobj.group('width')),
                    'height': int(mobj.group('height')),
                    'vbr': vbr,
                    'preference': 1,
                })

        if not formats:
            # No manifest to derive renditions from: expose the MP4 URL
            # as-is instead of failing on a missing manifest URL.
            fallback = {
                'url': mp4_url,
                'format_id': 'mp4',
                'preference': 1,
            }
            mobj = re.search(self._MP4_VARIANT_RE, mp4_url)
            if mobj:
                vbr = int(mobj.group('vbr'))
                fallback.update({
                    'format_id': 'mp4-%s' % vbr,
                    'width': int(mobj.group('width')),
                    'height': int(mobj.group('height')),
                    'vbr': vbr,
                })
            formats.append(fallback)

        return formats

    def _real_extract(self, url):
        """Return the info dict for the vgtv.no page at url.

        'title' and 'streamUrls' are required in the API response; every
        other metadata field is optional and yields None when absent.
        """
        mobj = re.match(self._VALID_URL, url)
        video_id = mobj.group('id')

        data = self._download_json(
            'http://svp.vg.no/svp/api/v1/vgtv/assets/%s?appName=vgtv-website' % video_id,
            video_id, 'Downloading media JSON')

        streams = data['streamUrls']

        formats = []

        hls_url = streams.get('hls')
        if hls_url:
            formats.extend(self._extract_m3u8_formats(hls_url, video_id, 'mp4'))

        hds_url = streams.get('hds')
        if hds_url:
            formats.extend(self._extract_f4m_formats(
                hds_url + '?hdcore=3.2.0&plugin=aasp-3.2.0.77.18', video_id))

        mp4_url = streams.get('mp4')
        if mp4_url:
            formats.extend(
                self._extract_mp4_formats(mp4_url, hls_url or hds_url))

        self._sort_formats(formats)

        # Thumbnail is optional; only append the resize query when a main
        # image is actually present.
        thumbnail = (data.get('images') or {}).get('main')
        if thumbnail:
            thumbnail += '?t[]=900x506q80'

        return {
            'id': video_id,
            'title': data['title'],
            'description': data.get('description'),
            'thumbnail': thumbnail,
            'timestamp': data.get('published'),
            # The original divides the API value by 1000 (scale argument).
            'duration': float_or_none(data.get('duration'), 1000),
            'view_count': data.get('displays'),
            'formats': formats,
        }