[zoom] Extract transcripts as subtitles

author pukkandan <redacted>

Sun, 6 Jun 2021 11:39:09 +0000 (17:09 +0530)

committer pukkandan <redacted>

Sun, 6 Jun 2021 11:39:09 +0000 (17:09 +0530)
author pukkandan <redacted>
Sun, 6 Jun 2021 11:39:09 +0000 (17:09 +0530)
committer pukkandan <redacted>
Sun, 6 Jun 2021 11:39:09 +0000 (17:09 +0530)
diff --git a/yt_dlp/extractor/zoom.py b/yt_dlp/extractor/zoom.py

index 6579f5ea4cd91fde41dd46751811bafb44559d3b..7accb6505caf96a607964c9eba5c34196cb65906 100644 (file)
--- a/yt_dlp/extractor/zoom.py
+++ b/yt_dlp/extractor/zoom.py
@@ -10,6 +10,7 @@
      js_to_json,
      parse_filesize,
      urlencode_postdata,
+    urljoin,
  )
  
  
@@ -55,10 +56,19 @@ def _real_extract(self, url):
              r'(?s)window\.__data__\s*=\s*({.+?});',
              webpage, 'data'), play_id, js_to_json)
  
+        subtitles = {}
+        for _type in ('transcript', 'cc'):
+            if data.get('%sUrl' % _type):
+                subtitles[_type] = [{
+                    'url': urljoin(base_url, data['%sUrl' % _type]),
+                    'ext': 'vtt',
+                }]
+
          return {
              'id': play_id,
              'title': data['topic'],
              'url': data['viewMp4Url'],
+            'subtitles': subtitles,
              'width': int_or_none(data.get('viewResolvtionsWidth')),
              'height': int_or_none(data.get('viewResolvtionsHeight')),
              'http_headers': {
author	pukkandan <redacted>
	Sun, 6 Jun 2021 11:39:09 +0000 (17:09 +0530)
committer	pukkandan <redacted>
	Sun, 6 Jun 2021 11:39:09 +0000 (17:09 +0530)