]> jfr.im git - yt-dlp.git/blob - yt_dlp/extractor/philharmoniedeparis.py
[ie/orf:on] Improve extraction (#9677)
[yt-dlp.git] / yt_dlp / extractor / philharmoniedeparis.py
1 from .common import InfoExtractor
2 from ..compat import compat_str
3 from ..utils import try_get
4
5
6 class PhilharmonieDeParisIE(InfoExtractor):
7 IE_DESC = 'Philharmonie de Paris'
8 _VALID_URL = r'''(?x)
9 https?://
10 (?:
11 live\.philharmoniedeparis\.fr/(?:[Cc]oncert/|embed(?:app)?/|misc/Playlist\.ashx\?id=)|
12 pad\.philharmoniedeparis\.fr/(?:doc/CIMU/|player\.aspx\?id=)|
13 philharmoniedeparis\.fr/fr/live/concert/|
14 otoplayer\.philharmoniedeparis\.fr/fr/embed/
15 )
16 (?P<id>\d+)
17 '''
18 _TESTS = [{
19 'url': 'https://philharmoniedeparis.fr/fr/live/concert/1129666-danses-symphoniques',
20 'md5': '24bdb7e86c200c107680e1f7770330ae',
21 'info_dict': {
22 'id': '1129666',
23 'ext': 'mp4',
24 'title': 'Danses symphoniques. Orchestre symphonique Divertimento - Zahia Ziouani. Bizet, de Falla, Stravinski, Moussorgski, Saint-Saëns',
25 },
26 }, {
27 'url': 'https://philharmoniedeparis.fr/fr/live/concert/1032066-akademie-fur-alte-musik-berlin-rias-kammerchor-rene-jacobs-passion-selon-saint-jean-de-johann',
28 'info_dict': {
29 'id': '1032066',
30 'title': 'Akademie für alte Musik Berlin, Rias Kammerchor, René Jacobs : Passion selon saint Jean de Johann Sebastian Bach',
31 },
32 'playlist_mincount': 2,
33 }, {
34 'url': 'https://philharmoniedeparis.fr/fr/live/concert/1030324-orchestre-philharmonique-de-radio-france-myung-whun-chung-renaud-capucon-pascal-dusapin-johannes',
35 'only_matching': True,
36 }, {
37 'url': 'http://live.philharmoniedeparis.fr/misc/Playlist.ashx?id=1030324&track=&lang=fr',
38 'only_matching': True,
39 }, {
40 'url': 'https://live.philharmoniedeparis.fr/embedapp/1098406/berlioz-fantastique-lelio-les-siecles-national-youth-choir-of.html?lang=fr-FR',
41 'only_matching': True,
42 }, {
43 'url': 'https://otoplayer.philharmoniedeparis.fr/fr/embed/1098406?lang=fr-FR',
44 'only_matching': True,
45 }]
46
47 def _real_extract(self, url):
48 video_id = self._match_id(url)
49
50 config = self._download_json(
51 'https://otoplayer.philharmoniedeparis.fr/fr/config/%s.json' % video_id, video_id, query={
52 'id': video_id,
53 'lang': 'fr-FR',
54 })
55
56 def extract_entry(source):
57 if not isinstance(source, dict):
58 return
59 title = source.get('title')
60 if not title:
61 return
62 files = source.get('files')
63 if not isinstance(files, dict):
64 return
65 format_urls = set()
66 formats = []
67 for format_id in ('mobile', 'desktop'):
68 format_url = try_get(
69 files, lambda x: x[format_id]['file'], compat_str)
70 if not format_url or format_url in format_urls:
71 continue
72 format_urls.add(format_url)
73 formats.extend(self._extract_m3u8_formats(
74 format_url, video_id, 'mp4', entry_protocol='m3u8_native',
75 m3u8_id='hls', fatal=False))
76 if not formats and not self.get_param('ignore_no_formats'):
77 return
78 return {
79 'title': title,
80 'formats': formats,
81 'thumbnail': files.get('thumbnail'),
82 }
83 info = extract_entry(config)
84 if info:
85 info.update({
86 'id': video_id,
87 })
88 return info
89 entries = []
90 for num, chapter in enumerate(config['chapters'], start=1):
91 entry = extract_entry(chapter)
92 if entry is None:
93 continue
94 entry['id'] = '%s-%d' % (video_id, num)
95 entries.append(entry)
96
97 return self.playlist_result(entries, video_id, config.get('title'))