]> jfr.im git - yt-dlp.git/blame - yt_dlp/extractor/fox.py
[ie/matchtv] Fix extractor (#10190)
[yt-dlp.git] / yt_dlp / extractor / fox.py
CommitLineData
41c2c254 1import json
add96eb9 2import urllib.parse
41c2c254 3import uuid
96c186e1 4
443f8de8 5from .common import InfoExtractor
3d2623a8 6from ..networking.exceptions import HTTPError
e37b54b1 7from ..utils import (
0d08bcdb 8 ExtractorError,
bf6ec2fe
S
9 int_or_none,
10 parse_age_limit,
11 parse_duration,
42a44f01 12 traverse_obj,
bf6ec2fe
S
13 try_get,
14 unified_timestamp,
42a44f01 15 url_or_none,
e37b54b1 16)
9787c5f4 17
18
class FOXIE(InfoExtractor):
    """Extractor for fox.com / foxsports.com ``watch`` and ``replay`` pages."""

    _VALID_URL = r'https?://(?:www\.)?fox(?:sports)?\.com/(?:watch|replay)/(?P<id>[\da-fA-F]+)'
    _TESTS = [{
        # clip
        'url': 'https://www.fox.com/watch/4b765a60490325103ea69888fb2bd4e8/',
        'md5': 'ebd296fcc41dd4b19f8115d8461a3165',
        'info_dict': {
            'id': '4b765a60490325103ea69888fb2bd4e8',
            'ext': 'mp4',
            'title': 'Aftermath: Bruce Wayne Develops Into The Dark Knight',
            'description': 'md5:549cd9c70d413adb32ce2a779b53b486',
            'duration': 102,
            'timestamp': 1504291893,
            'upload_date': '20170901',
            'creator': 'FOX',
            'series': 'Gotham',
            'age_limit': 14,
            'episode': 'Aftermath: Bruce Wayne Develops Into The Dark Knight',
            'thumbnail': r're:^https?://.*\.jpg$',
        },
        'params': {
            'skip_download': True,
        },
    }, {
        # episode, geo-restricted
        'url': 'https://www.fox.com/watch/087036ca7f33c8eb79b08152b4dd75c1/',
        'only_matching': True,
    }, {
        # sports event, geo-restricted
        'url': 'https://www.fox.com/watch/b057484dade738d1f373b3e46216fa2c/',
        'only_matching': True,
    }, {
        # fox sports replay, geo-restricted
        'url': 'https://www.foxsports.com/replay/561f3e071347a24e5e877abc56b22e89',
        'only_matching': True,
    }]
    _GEO_BYPASS = False
    # Page whose cookie jar is searched for the 'mvpd-auth' cookie
    _HOME_PAGE_URL = 'https://www.fox.com/'
    # Sent as the 'X-Api-Key' header on every API request
    _API_KEY = '6E9S4bmcoNnZwVLOHywOv8PJEdu76cM9'
    # Bearer token; filled in by _real_initialize() / _real_extract()
    _access_token = None
    # Random device ID, generated once when the class body is executed
    _device_id = str(uuid.uuid4())

    def _call_api(self, path, video_id, data=None):
        """Request ``https://api3.fox.com/v2.0/<path>`` and return the parsed JSON.

        The API key is always sent; a bearer ``Authorization`` header is added
        when an access token is already known. ``data`` is forwarded unchanged
        to ``_download_json``.

        Raises:
            ExtractorError: with ``expected=True`` when the API answers
                HTTP 403; any other failure is re-raised as-is.
        """
        headers = {
            'X-Api-Key': self._API_KEY,
        }
        if self._access_token:
            headers['Authorization'] = 'Bearer ' + self._access_token
        try:
            return self._download_json(
                'https://api3.fox.com/v2.0/' + path,
                video_id, data=data, headers=headers)
        except ExtractorError as e:
            if isinstance(e.cause, HTTPError) and e.cause.status == 403:
                # The 403 body lists the reasons access was denied
                entitlement_issues = self._parse_json(
                    e.cause.response.read().decode(), video_id)['entitlementIssues']
                # A distinct loop name keeps the caught exception `e` unshadowed
                for issue in entitlement_issues:
                    if issue.get('errorCode') == 1005:
                        raise ExtractorError(
                            'This video is only available via cable service provider '
                            'subscription. You may want to use --cookies.', expected=True)
                messages = ', '.join([issue['message'] for issue in entitlement_issues])
                raise ExtractorError(messages, expected=True)
            raise

    def _real_initialize(self):
        """Make sure ``self._access_token`` is set before extraction.

        The token is taken from the ``mvpd-auth`` cookie of the home page
        (URL-quoted JSON carrying an ``accessToken`` key) when available;
        otherwise it is requested from the ``login`` endpoint using the
        device ID.
        """
        if not self._access_token:
            mvpd_auth = self._get_cookies(self._HOME_PAGE_URL).get('mvpd-auth')
            if mvpd_auth:
                # fatal=False: an unparsable cookie falls through to the login call
                self._access_token = (self._parse_json(urllib.parse.unquote(
                    mvpd_auth.value), None, fatal=False) or {}).get('accessToken')
            if not self._access_token:
                self._access_token = self._call_api(
                    'login', None, json.dumps({
                        'deviceId': self._device_id,
                    }).encode())['accessToken']

    def _real_extract(self, url):
        """Return the info dict (formats, metadata, subtitles) for ``url``.

        Raises:
            ExtractorError: when the release URL answers HTTP 403; the
                ``GeoLocationBlocked`` case is reported through
                ``raise_geo_restricted`` instead.
        """
        video_id = self._match_id(url)

        # Replace the current token with the one returned by 'previewpassmvpd'
        self._access_token = self._call_api(
            f'previewpassmvpd?device_id={self._device_id}&mvpd_id=TempPass_fbcfox_60min',
            video_id)['accessToken']

        video = self._call_api('watch', video_id, data=json.dumps({
            'capabilities': ['drm/widevine', 'fsdk/yo'],
            'deviceWidth': 1280,
            'deviceHeight': 720,
            'maxRes': '720p',
            'os': 'macos',
            'osv': '',
            'provider': {
                'freewheel': {'did': self._device_id},
                'vdms': {'rays': ''},
                'dmp': {'kuid': '', 'seg': ''},
            },
            'playlist': '',
            'privacy': {'us': '1---'},
            'siteSection': '',
            'streamType': 'vod',
            'streamId': video_id}).encode())

        title = video['name']
        release_url = video['url']

        try:
            m3u8_url = self._download_json(release_url, video_id)['playURL']
        except ExtractorError as e:
            if isinstance(e.cause, HTTPError) and e.cause.status == 403:
                error = self._parse_json(e.cause.response.read().decode(), video_id)
                if error.get('exception') == 'GeoLocationBlocked':
                    self.raise_geo_restricted(countries=['US'])
                raise ExtractorError(error['description'], expected=True)
            raise
        formats = self._extract_m3u8_formats(
            m3u8_url, video_id, 'mp4',
            entry_protocol='m3u8_native', m3u8_id='hls')

        # Secondary metadata source used as fallback for creator / series
        data = try_get(
            video, lambda x: x['trackingData']['properties'], dict) or {}

        duration = int_or_none(video.get('durationInSeconds')) or int_or_none(
            video.get('duration')) or parse_duration(video.get('duration'))
        timestamp = unified_timestamp(video.get('datePublished'))
        creator = data.get('brand') or data.get('network') or video.get('network')
        series = video.get('seriesName') or data.get(
            'seriesName') or data.get('show')

        subtitles = {}
        # `or []` also covers an explicit null value for the key
        for doc_rel in video.get('documentReleases') or []:
            rel_url = doc_rel.get('url')
            # Check the release's own URL; the page `url` is always truthy,
            # so testing it would let URL-less releases through
            if not rel_url or doc_rel.get('format') != 'SCC':
                continue
            subtitles['en'] = [{
                'url': rel_url,
                'ext': 'scc',
            }]
            # Only the first usable SCC release is kept
            break

        return {
            'id': video_id,
            'title': title,
            'formats': formats,
            'description': video.get('description'),
            'duration': duration,
            'timestamp': timestamp,
            'age_limit': parse_age_limit(video.get('contentRating')),
            'creator': creator,
            'series': series,
            'season_number': int_or_none(video.get('seasonNumber')),
            'episode': video.get('name'),
            'episode_number': int_or_none(video.get('episodeNumber')),
            'thumbnail': traverse_obj(video, ('images', 'still', 'raw'), expected_type=url_or_none),
            'release_year': int_or_none(video.get('releaseYear')),
            'subtitles': subtitles,
        }