]> jfr.im git - yt-dlp.git/blame - yt_dlp/extractor/byutv.py
[ie/orf:on] Improve extraction (#9677)
[yt-dlp.git] / yt_dlp / extractor / byutv.py
CommitLineData
6949d810 1from .common import InfoExtractor
df63cafe
S
2from ..utils import (
3 determine_ext,
4 merge_dicts,
5 parse_duration,
6 url_or_none,
7)
6949d810
PH
8
9
10class BYUtvIE(InfoExtractor):
9751a457 11 _WORKING = False
c8be7d5f 12 _VALID_URL = r'https?://(?:www\.)?byutv\.org/(?:watch|player)/(?!event/)(?P<id>[0-9a-f-]+)(?:/(?P<display_id>[^/?#&]+))?'
6d2549fb 13 _TESTS = [{
7009a904 14 'url': 'http://www.byutv.org/watch/6587b9a3-89d2-42a6-a7f7-fd2f81840a7d/studio-c-season-5-episode-5',
6949d810 15 'info_dict': {
c8be7d5f 16 'id': 'ZvanRocTpW-G5_yZFeltTAMv6jxOU9KH',
6d2549fb 17 'display_id': 'studio-c-season-5-episode-5',
6949d810 18 'ext': 'mp4',
7009a904 19 'title': 'Season 5 Episode 5',
c8be7d5f
S
20 'description': 'md5:1d31dc18ef4f075b28f6a65937d22c65',
21 'thumbnail': r're:^https?://.*',
53e06b25 22 'duration': 1486.486,
6949d810 23 },
688c634b 24 'params': {
25 'skip_download': True,
26 },
ab116745 27 }, {
0db2b275
S
28 # dvr
29 'url': 'https://www.byutv.org/player/8f1dab9b-b243-47c8-b525-3e2d021a3451/byu-softball-pacific-vs-byu-41219---game-2',
ab116745 30 'info_dict': {
0db2b275
S
31 'id': '8f1dab9b-b243-47c8-b525-3e2d021a3451',
32 'display_id': 'byu-softball-pacific-vs-byu-41219---game-2',
ab116745 33 'ext': 'mp4',
0db2b275
S
34 'title': 'Pacific vs. BYU (4/12/19)',
35 'description': 'md5:1ac7b57cb9a78015910a4834790ce1f3',
36 'duration': 11645,
ab116745
MT
37 },
38 'params': {
39 'skip_download': True
40 },
6d2549fb
S
41 }, {
42 'url': 'http://www.byutv.org/watch/6587b9a3-89d2-42a6-a7f7-fd2f81840a7d',
43 'only_matching': True,
c8be7d5f
S
44 }, {
45 'url': 'https://www.byutv.org/player/27741493-dc83-40b0-8420-e7ae38a2ae98/byu-football-toledo-vs-byu-93016?listid=4fe0fee5-0d3c-4a29-b725-e4948627f472&listindex=0&q=toledo',
46 'only_matching': True,
6d2549fb 47 }]
6949d810
PH
48
49 def _real_extract(self, url):
5ad28e7f 50 mobj = self._match_valid_url(url)
6d2549fb 51 video_id = mobj.group('id')
0db2b275 52 display_id = mobj.group('display_id') or video_id
6949d810 53
df63cafe 54 video = self._download_json(
0db2b275
S
55 'https://api.byutv.org/api3/catalog/getvideosforcontent',
56 display_id, query={
c8be7d5f 57 'contentid': video_id,
6bf9c28b
RA
58 'channel': 'byutv',
59 'x-byutv-context': 'web$US',
c8be7d5f 60 }, headers={
6bf9c28b 61 'x-byutv-context': 'web$US',
c8be7d5f 62 'x-byutv-platformkey': 'xsaaw9c7y5',
ab116745 63 })
6d2549fb 64
df63cafe
S
65 info = {}
66 formats = []
64a5cf79 67 subtitles = {}
df63cafe
S
68 for format_id, ep in video.items():
69 if not isinstance(ep, dict):
70 continue
71 video_url = url_or_none(ep.get('videoUrl'))
72 if not video_url:
73 continue
74 ext = determine_ext(video_url)
75 if ext == 'm3u8':
64a5cf79 76 m3u8_fmts, m3u8_subs = self._extract_m3u8_formats_and_subtitles(
df63cafe 77 video_url, video_id, 'mp4', entry_protocol='m3u8_native',
64a5cf79
F
78 m3u8_id='hls', fatal=False)
79 formats.extend(m3u8_fmts)
80 subtitles = self._merge_subtitles(subtitles, m3u8_subs)
df63cafe 81 elif ext == 'mpd':
64a5cf79
F
82 mpd_fmts, mpd_subs = self._extract_mpd_formats_and_subtitles(
83 video_url, video_id, mpd_id='dash', fatal=False)
84 formats.extend(mpd_fmts)
85 subtitles = self._merge_subtitles(subtitles, mpd_subs)
df63cafe
S
86 else:
87 formats.append({
88 'url': video_url,
89 'format_id': format_id,
90 })
91 merge_dicts(info, {
92 'title': ep.get('title'),
93 'description': ep.get('description'),
94 'thumbnail': ep.get('imageThumbnail'),
95 'duration': parse_duration(ep.get('length')),
96 })
df63cafe
S
97
98 return merge_dicts(info, {
0db2b275
S
99 'id': video_id,
100 'display_id': display_id,
df63cafe 101 'title': display_id,
0db2b275 102 'formats': formats,
64a5cf79 103 'subtitles': subtitles,
df63cafe 104 })