]> jfr.im git - yt-dlp.git/blame - yt_dlp/extractor/amcnetworks.py
[ie/youtube] Suppress "Unavailable videos are hidden" warning (#10159)
[yt-dlp.git] / yt_dlp / extractor / amcnetworks.py
CommitLineData
29f7c58a 1import re
2
b5ddee8c
RA
3from .theplatform import ThePlatformIE
4from ..utils import (
837e56c8 5 int_or_none,
9682666b
S
6 parse_age_limit,
7 try_get,
8 update_url_query,
b5ddee8c
RA
9)
10
11
class AMCNetworksIE(ThePlatformIE):  # XXX: Do not subclass from concrete IE
    """Extractor for video pages on amc.com, bbcamerica.com, ifc.com, wetv.com and sundancetv.com."""

    _VALID_URL = r'https?://(?:www\.)?(?P<site>amc|bbcamerica|ifc|(?:we|sundance)tv)\.com/(?P<id>(?:movies|shows(?:/[^/]+)+)/[^/?#&]+)'
    _TESTS = [{
        'url': 'https://www.bbcamerica.com/shows/the-graham-norton-show/videos/tina-feys-adorable-airline-themed-family-dinner--51631',
        'info_dict': {
            'id': '4Lq1dzOnZGt0',
            'ext': 'mp4',
            'title': "The Graham Norton Show - Season 28 - Tina Fey's Adorable Airline-Themed Family Dinner",
            'description': "It turns out child stewardesses are very generous with the wine! All-new episodes of 'The Graham Norton Show' premiere Fridays at 11/10c on BBC America.",
            'upload_date': '20201120',
            'timestamp': 1605904350,
            'uploader': 'AMCN',
        },
        'params': {
            # m3u8 download
            'skip_download': True,
        },
        'skip': '404 Not Found',
    }, {
        'url': 'http://www.bbcamerica.com/shows/the-hunt/full-episodes/season-1/episode-01-the-hardest-challenge',
        'only_matching': True,
    }, {
        'url': 'http://www.amc.com/shows/preacher/full-episodes/season-01/episode-00/pilot',
        'only_matching': True,
    }, {
        'url': 'http://www.wetv.com/shows/million-dollar-matchmaker/season-01/episode-06-the-dumped-dj-and-shallow-hal',
        'only_matching': True,
    }, {
        'url': 'http://www.ifc.com/movies/chaos',
        'only_matching': True,
    }, {
        'url': 'http://www.bbcamerica.com/shows/doctor-who/full-episodes/the-power-of-the-daleks/episode-01-episode-1-color-version',
        'only_matching': True,
    }, {
        'url': 'http://www.wetv.com/shows/mama-june-from-not-to-hot/full-episode/season-01/thin-tervention',
        'only_matching': True,
    }, {
        'url': 'http://www.wetv.com/shows/la-hair/videos/season-05/episode-09-episode-9-2/episode-9-sneak-peek-3',
        'only_matching': True,
    }, {
        'url': 'https://www.sundancetv.com/shows/riviera/full-episodes/season-1/episode-01-episode-1',
        'only_matching': True,
    }]
    # Site name captured by _VALID_URL -> requestor id. The id is passed to the
    # MVPD auth helpers as-is and, lowercased, forms part of the content API path.
    _REQUESTOR_ID_MAP = {
        'amc': 'AMC',
        'bbcamerica': 'BBCA',
        'ifc': 'IFC',
        'sundancetv': 'SUNDANCE',
        'wetv': 'WETV',
    }

    def _real_extract(self, url):
        """Build the info dict for the page at *url*.

        Fetches the page's JSON description from the content-delivery API,
        picks a ThePlatform path (a ``releasePid`` from a ``video-player``
        child when one is available, otherwise the page-level ``videoPid``),
        then downloads ThePlatform metadata and the SMIL formats/subtitles.

        Raises KeyError if neither a usable ``releasePid`` nor a ``videoPid``
        is present, or if the metadata lacks ``pid``/``title``.
        """
        site, display_id = self._match_valid_url(url).groups()
        requestor_id = self._REQUESTOR_ID_MAP[site]
        page_data = self._download_json(
            f'https://content-delivery-gw.svc.ds.amcn.com/api/v2/content/amcn/{requestor_id.lower()}/url/{display_id}',
            display_id)['data']
        properties = page_data.get('properties') or {}
        query = {
            'mbr': 'true',
            'manifest': 'm3u',
        }

        tp_path = media_url = None
        video_player_count = 0
        # Inspect each child independently: a missing/null `children` list or a
        # single malformed player must not abort the scan or raise.
        for child in page_data.get('children') or []:
            if try_get(child, lambda x: x['type']) != 'video-player':
                continue
            release_pid = try_get(
                child, lambda x: x['properties']['currentVideo']['meta']['releasePid'], str)
            if not release_pid:
                continue
            # When several players are present, the last usable one wins.
            tp_path = 'M_UwQC/' + release_pid
            media_url = 'https://link.theplatform.com/s/' + tp_path
            video_player_count += 1
        if video_player_count > 1:
            self.report_warning(
                f'The JSON data has {video_player_count} video players. Only one will be extracted')

        # Fall back to videoPid if releasePid not found.
        # TODO: Fall back to videoPid if releasePid manifest uses DRM.
        if not video_player_count:
            tp_path = 'M_UwQC/media/' + properties['videoPid']
            media_url = 'https://link.theplatform.com/s/' + tp_path

        theplatform_metadata = self._download_theplatform_metadata(tp_path, display_id)
        info = self._parse_theplatform_metadata(theplatform_metadata)
        video_id = theplatform_metadata['pid']
        title = theplatform_metadata['title']
        rating = try_get(
            theplatform_metadata, lambda x: x['ratings'][0]['rating'])
        video_category = properties.get('videoCategory')
        # Categories ending in '-Auth' get an MVPD auth token added to the query.
        if video_category and video_category.endswith('-Auth'):
            resource = self._get_mvpd_resource(
                requestor_id, title, video_id, rating)
            query['auth'] = self._extract_mvpd_auth(
                url, video_id, requestor_id, resource)
        media_url = update_url_query(media_url, query)
        formats, subtitles = self._extract_theplatform_smil(
            media_url, video_id)

        thumbnails = []
        thumbnail_urls = [properties.get('imageDesktop')]
        if 'thumbnail' in info:
            thumbnail_urls.append(info.pop('thumbnail'))
        for thumbnail_url in thumbnail_urls:
            if not thumbnail_url:
                continue
            # Take dimensions from the first "<digits>x<digits>" in the URL, if any.
            mobj = re.search(r'(\d+)x(\d+)', thumbnail_url)
            thumbnails.append({
                'url': thumbnail_url,
                'width': int(mobj.group(1)) if mobj else None,
                'height': int(mobj.group(2)) if mobj else None,
            })

        info.update({
            'age_limit': parse_age_limit(rating),
            'formats': formats,
            'id': video_id,
            'subtitles': subtitles,
            'thumbnails': thumbnails,
        })
        # Episode/season fields are stored under a namespace prefix taken from
        # the first key of `$xmlns`; tolerate the key being absent or null.
        ns = next(iter(theplatform_metadata.get('$xmlns') or {}), None)
        if ns is not None:
            episode = theplatform_metadata.get(ns + '$episodeTitle') or None
            episode_number = int_or_none(
                theplatform_metadata.get(ns + '$episode'))
            season_number = int_or_none(
                theplatform_metadata.get(ns + '$season'))
            series = theplatform_metadata.get(ns + '$show') or None
            info.update({
                'episode': episode,
                'episode_number': episode_number,
                'season_number': season_number,
                'series': series,
            })
        return info