jfr.im git - yt-dlp.git/blame - yt_dlp/extractor/atvat.py
[panopto] Add extractors (#2908)
[yt-dlp.git] / yt_dlp / extractor / atvat.py
CommitLineData
d66d43c5
RA
1# coding: utf-8
2from __future__ import unicode_literals
3
49fa4d9a
N
4import datetime
5
d66d43c5
RA
6from .common import InfoExtractor
7from ..utils import (
49fa4d9a
N
8 float_or_none,
9 jwt_encode_hs256,
10 try_get,
5c6dfc1f 11 ExtractorError,
d66d43c5
RA
12)
13
14
class ATVAtIE(InfoExtractor):
    """Extractor for TV episode pages on atv.at.

    The page embeds a JSON state blob listing the content resources (clips)
    of an episode.  The stream URLs for those clips are requested from the
    ``getsources`` endpoint using a short-lived JWT signed with
    ``_ENCRYPTION_KEY``; the result is returned as a ``multi_video`` with one
    entry per clip.
    """

    _VALID_URL = r'https?://(?:www\.)?atv\.at/tv/(?:[^/]+/){2,3}(?P<id>.*)'

    _TESTS = [{
        'url': 'https://www.atv.at/tv/bauer-sucht-frau/staffel-18/bauer-sucht-frau/bauer-sucht-frau-staffel-18-folge-3-die-hofwochen',
        'md5': '3c3b4aaca9f63e32b35e04a9c2515903',
        'info_dict': {
            'id': 'v-ce9cgn1e70n5-1',
            'ext': 'mp4',
            'title': 'Bauer sucht Frau - Staffel 18 Folge 3 - Die Hofwochen',
        }
    }, {
        'url': 'https://www.atv.at/tv/bauer-sucht-frau/staffel-18/episode-01/bauer-sucht-frau-staffel-18-vorstellungsfolge-1',
        'only_matching': True,
    }]

    # extracted from bootstrap.js function (search for e.encryption_key and use your browser's debugger)
    _ACCESS_ID = 'x_atv'
    _ENCRYPTION_KEY = 'Hohnaekeishoogh2omaeghooquooshia'

    def _extract_video_info(self, url, content, video):
        """Build the info dict for a single clip.

        :param url: page URL; accepted for interface compatibility, not used here.
        :param content: the clip's entry from the page's ``contentResource`` list.
        :param video: the matching entry from the ``getsources`` response;
            its ``urls`` mapping is keyed by protocol name.
        :return: info dict with ``id``, ``title``, ``duration``, ``series``
            and ``formats``.
        :raises KeyError: if ``video`` has no ``urls`` key, or ``content`` has
            neither ``splitId`` nor ``id``.
        """
        # Prefer 'splitId'; only touch 'id' when it is really needed, so a
        # resource that carries 'splitId' but no 'id' does not raise KeyError.
        clip_id = content['splitId'] if 'splitId' in content else content['id']

        formats = []
        for protocol, variant in video['urls'].items():
            # Only the 'clear' variant of each protocol is used.
            source_url = try_get(variant, lambda x: x['clear']['url'])
            if not source_url:
                continue
            if protocol == 'dash':
                formats.extend(self._extract_mpd_formats(
                    source_url, clip_id, mpd_id=protocol, fatal=False))
            elif protocol == 'hls':
                formats.extend(self._extract_m3u8_formats(
                    source_url, clip_id, 'mp4', 'm3u8_native',
                    m3u8_id=protocol, fatal=False))
            else:
                # Any other protocol is passed through as a direct URL.
                formats.append({
                    'url': source_url,
                    'format_id': protocol,
                })
        self._sort_formats(formats)

        return {
            'id': clip_id,
            'title': content.get('title'),
            'duration': float_or_none(content.get('duration')),
            'series': content.get('tvShowTitle'),
            'formats': formats,
        }

    def _real_extract(self, url):
        """Extract all clips of an episode page as a ``multi_video`` result.

        :param url: episode page URL matching ``_VALID_URL``.
        :return: ``multi_video`` info dict whose entries come from
            ``_extract_video_info``.
        :raises ExtractorError: if the page lists no content resources, the
            API returns no data, or the API reports an error (geo
            restriction is reported through ``raise_geo_restricted``).
        """
        video_id = self._match_id(url)
        webpage = self._download_webpage(url, video_id)
        json_data = self._parse_json(
            self._search_regex(r'<script id="state" type="text/plain">(.*)</script>', webpage, 'json_data'),
            video_id=video_id)

        page = json_data['views']['default']['page']
        video_title = page['title']
        content_resource = page['contentResource']
        if not content_resource:
            raise ExtractorError('No content resources found on the page')

        # The first resource's id keys the request; each clip is identified
        # by its index in the list, which the response echoes back as 'id'.
        content_id = content_resource[0]['id']
        content_ids = [
            {'id': index, 'subclip_start': content['start'], 'subclip_end': content['end']}
            for index, content in enumerate(content_resource)]

        # Token validity window: five minutes before to five minutes after now.
        time_of_request = datetime.datetime.now()
        not_before = time_of_request - datetime.timedelta(minutes=5)
        expire = time_of_request + datetime.timedelta(minutes=5)
        payload = {
            'content_ids': {
                content_id: content_ids,
            },
            'secure_delivery': True,
            'iat': int(time_of_request.timestamp()),
            'nbf': int(not_before.timestamp()),
            'exp': int(expire.timestamp()),
        }
        jwt_token = jwt_encode_hs256(payload, self._ENCRYPTION_KEY, headers={'kid': self._ACCESS_ID})
        videos = self._download_json(
            'https://vas-v4.p7s1video.net/4.0/getsources',
            content_id, 'Downloading videos JSON', query={
                'token': jwt_token.decode('utf-8')
            })

        sources = videos['data']
        if not sources:
            raise ExtractorError('No video sources returned for %s' % content_id)
        # Only the first (id, data) pair of the response is used.
        video_id, videos_data = next(iter(sources.items()))

        # try_get yields None when videos_data carries no error title.
        error_msg = try_get(videos_data, lambda x: x['error']['title'])
        if error_msg == 'Geo check failed':
            self.raise_geo_restricted(error_msg)
        elif error_msg:
            raise ExtractorError(error_msg)

        # video['id'] is the list index sent in the request's content_ids.
        entries = [
            self._extract_video_info(url, content_resource[video['id']], video)
            for video in videos_data]

        return {
            '_type': 'multi_video',
            'id': video_id,
            'title': video_title,
            'entries': entries,
        }