From: FrankZ85 Date: Wed, 15 Nov 2023 22:38:52 +0000 (+0100) Subject: [ie/tv5mondeplus] Extract subtitles (#4209) X-Git-Tag: 2023.11.16~10 X-Git-Url: https://jfr.im/git/yt-dlp.git/commitdiff_plain/0f634dba3afdc429ece8839b02f6d56c27b7973a [ie/tv5mondeplus] Extract subtitles (#4209) Closes #4205 Authored by: FrankZ85 --- diff --git a/yt_dlp/extractor/tv5mondeplus.py b/yt_dlp/extractor/tv5mondeplus.py index 4da1b26d1..a445fae85 100644 --- a/yt_dlp/extractor/tv5mondeplus.py +++ b/yt_dlp/extractor/tv5mondeplus.py @@ -84,6 +84,13 @@ class TV5MondePlusIE(InfoExtractor): }] _GEO_BYPASS = False + @staticmethod + def _extract_subtitles(data_captions): + subtitles = {} + for f in traverse_obj(data_captions, ('files', lambda _, v: url_or_none(v['file']))): + subtitles.setdefault(f.get('label') or 'fra', []).append({'url': f['file']}) + return subtitles + def _real_extract(self, url): display_id = self._match_id(url) webpage = self._download_webpage(url, display_id) @@ -176,6 +183,8 @@ def process_video_files(v): 'duration': duration, 'upload_date': upload_date, 'formats': formats, + 'subtitles': self._extract_subtitles(self._parse_json( + traverse_obj(vpl_data, ('data-captions', {str}), default='{}'), display_id, fatal=False)), 'series': series, 'episode': episode, }