[ie/crunchyroll] Fix stream extraction (#10005)

[yt-dlp.git] / yt_dlp / extractor / tv2dk.py
diff --git a/yt_dlp/extractor/tv2dk.py b/yt_dlp/extractor/tv2dk.py

index 8bda9348d723073b894d2d77b6556b51d89dad80..35e92f10c4dffeb486b0cf3511faee8a019d0f20 100644 (file)
--- a/yt_dlp/extractor/tv2dk.py
+++ b/yt_dlp/extractor/tv2dk.py
@@ -1,6 +1,3 @@
-# coding: utf-8
-from __future__ import unicode_literals
-
  import json
  import re
  
@@ -41,8 +38,16 @@ class TV2DKIE(InfoExtractor):
              'duration': 1347,
              'view_count': int,
          },
-        'params': {
-            'skip_download': True,
+        'add_ie': ['Kaltura'],
+    }, {
+        'url': 'https://www.tv2lorry.dk/gadekamp/gadekamp-6-hoejhuse-i-koebenhavn',
+        'info_dict': {
+            'id': '1_7iwll9n0',
+            'ext': 'mp4',
+            'upload_date': '20211027',
+            'title': 'Gadekamp #6 - Højhuse i København',
+            'uploader_id': 'tv2lorry',
+            'timestamp': 1635345229,
          },
          'add_ie': ['Kaltura'],
      }, {
@@ -74,6 +79,12 @@ def _real_extract(self, url):
          webpage = self._download_webpage(url, video_id)
  
          entries = []
+
+        def add_entry(partner_id, kaltura_id):
+            entries.append(self.url_result(
+                'kaltura:%s:%s' % (partner_id, kaltura_id), 'Kaltura',
+                video_id=kaltura_id))
+
          for video_el in re.findall(r'(?s)<[^>]+\bdata-entryid\s*=[^>]*>', webpage):
              video = extract_attributes(video_el)
              kaltura_id = video.get('data-entryid')
@@ -82,9 +93,17 @@ def _real_extract(self, url):
              partner_id = video.get('data-partnerid')
              if not partner_id:
                  continue
-            entries.append(self.url_result(
-                'kaltura:%s:%s' % (partner_id, kaltura_id), 'Kaltura',
-                video_id=kaltura_id))
+            add_entry(partner_id, kaltura_id)
+        if not entries:
+            kaltura_id = self._search_regex(
+                (r'entry_id\s*:\s*["\']([0-9a-z_]+)',
+                 r'\\u002FentryId\\u002F(\w+)\\u002F'), webpage, 'kaltura id')
+            partner_id = self._search_regex(
+                (r'\\u002Fp\\u002F(\d+)\\u002F', r'/p/(\d+)/'), webpage,
+                'partner id')
+            add_entry(partner_id, kaltura_id)
+        if len(entries) == 1:
+            return entries[0]
          return self.playlist_result(entries)
  
  
@@ -145,7 +164,6 @@ def _real_extract(self, url):
                  formats.append({
                      'url': src,
                  })
-        self._sort_formats(formats)
  
          return {
              'id': video_id,