[extractors] Use new framework for existing embeds (#4307)

[yt-dlp.git] / yt_dlp / extractor / threeqsdn.py
diff --git a/yt_dlp/extractor/threeqsdn.py b/yt_dlp/extractor/threeqsdn.py

index bb7610352d58fdea9b51b86a7fe989c0a1d44b3e..a313a8dfbe6332a0b9c94d6cdf8fdd940777b0a7 100644 (file)
--- a/yt_dlp/extractor/threeqsdn.py
+++ b/yt_dlp/extractor/threeqsdn.py
@@ -1,7 +1,3 @@
-from __future__ import unicode_literals
-
-import re
-
  from .common import InfoExtractor
  from ..compat import compat_HTTPError
  from ..utils import (
@@ -9,6 +5,7 @@
      ExtractorError,
      float_or_none,
      int_or_none,
+    join_nonempty,
      parse_iso8601,
  )
  
@@ -17,6 +14,7 @@ class ThreeQSDNIE(InfoExtractor):
      IE_NAME = '3qsdn'
      IE_DESC = '3Q SDN'
      _VALID_URL = r'https?://playout\.3qsdn\.com/(?P<id>[\da-f]{8}-[\da-f]{4}-[\da-f]{4}-[\da-f]{4}-[\da-f]{12})'
+    _EMBED_REGEX = [r'<iframe[^>]+\b(?:data-)?src=(["\'])(?P<url>%s.*?)\1' % _VALID_URL]
      _TESTS = [{
          # https://player.3qsdn.com/demo.html
          'url': 'https://playout.3qsdn.com/7201c779-6b3c-11e7-a40e-002590c750be',
@@ -77,12 +75,13 @@ class ThreeQSDNIE(InfoExtractor):
          'only_matching': True,
      }]
  
-    @staticmethod
-    def _extract_url(webpage):
-        mobj = re.search(
-            r'<iframe[^>]+\b(?:data-)?src=(["\'])(?P<url>%s.*?)\1' % ThreeQSDNIE._VALID_URL, webpage)
-        if mobj:
-            return mobj.group('url')
+    def _extract_from_webpage(self, url, webpage):
+        for res in super()._extract_from_webpage(url, webpage):
+            yield {
+                **res,
+                '_type': 'url_transparent',
+                'uploader': self._search_regex(r'^(?:https?://)?([^/]*)/.*', url, 'video uploader'),
+            }
  
      def _real_extract(self, url):
          video_id = self._match_id(url)
@@ -110,8 +109,7 @@ def _real_extract(self, url):
                  subtitles = self._merge_subtitles(subtitles, subs)
              elif source_type == 'hls':
                  fmts, subs = self._extract_m3u8_formats_and_subtitles(
-                    source, video_id, 'mp4', 'm3u8' if live else 'm3u8_native',
-                    m3u8_id='hls', fatal=False)
+                    source, video_id, 'mp4', live=live, m3u8_id='hls', fatal=False)
                  formats.extend(fmts)
                  subtitles = self._merge_subtitles(subtitles, subs)
              elif source_type == 'progressive':
@@ -119,24 +117,16 @@ def _real_extract(self, url):
                      src = s.get('src')
                      if not (src and self._is_valid_url(src, video_id)):
                          continue
-                    width = None
-                    format_id = ['http']
                      ext = determine_ext(src)
-                    if ext:
-                        format_id.append(ext)
                      height = int_or_none(s.get('height'))
-                    if height:
-                        format_id.append('%dp' % height)
-                        if aspect:
-                            width = int(height * aspect)
                      formats.append({
                          'ext': ext,
-                        'format_id': '-'.join(format_id),
+                        'format_id': join_nonempty('http', ext, height and '%dp' % height),
                          'height': height,
                          'source_preference': 0,
                          'url': src,
                          'vcodec': 'none' if height == 0 else None,
-                        'width': width,
+                        'width': int(height * aspect) if height and aspect else None,
                      })
          # It seems like this would be correctly handled by default
          # However, unless someone can confirm this, the old
@@ -155,7 +145,7 @@ def _real_extract(self, url):
  
          return {
              'id': video_id,
-            'title': self._live_title(title) if live else title,
+            'title': title,
              'thumbnail': config.get('poster') or None,
              'description': config.get('description') or None,
              'timestamp': parse_iso8601(config.get('upload_date')),