jfr.im git - yt-dlp.git/commitdiff
[zoom] Extract transcripts as subtitles
author pukkandan <redacted>
Sun, 6 Jun 2021 11:39:09 +0000 (17:09 +0530)
committer pukkandan <redacted>
Sun, 6 Jun 2021 11:39:09 +0000 (17:09 +0530)
yt_dlp/extractor/zoom.py

index 6579f5ea4cd91fde41dd46751811bafb44559d3b..7accb6505caf96a607964c9eba5c34196cb65906 100644 (file)
@@ -10,6 +10,7 @@
     js_to_json,
     parse_filesize,
     urlencode_postdata,
+    urljoin,
 )
 
 
@@ -55,10 +56,19 @@ def _real_extract(self, url):
             r'(?s)window\.__data__\s*=\s*({.+?});',
             webpage, 'data'), play_id, js_to_json)
 
+        subtitles = {}
+        for _type in ('transcript', 'cc'):
+            if data.get('%sUrl' % _type):
+                subtitles[_type] = [{
+                    'url': urljoin(base_url, data['%sUrl' % _type]),
+                    'ext': 'vtt',
+                }]
+
         return {
             'id': play_id,
             'title': data['topic'],
             'url': data['viewMp4Url'],
+            'subtitles': subtitles,
             'width': int_or_none(data.get('viewResolvtionsWidth')),
             'height': int_or_none(data.get('viewResolvtionsHeight')),
             'http_headers': {