[ie/crunchyroll] Fix stream extraction (#10005)

[yt-dlp.git] / yt_dlp / extractor / aenetworks.py
diff --git a/yt_dlp/extractor/aenetworks.py b/yt_dlp/extractor/aenetworks.py

index e55c03fd701a4f098c325df12baa64816b903678..ab4b6c0ebc958ac05c4e61d6ae5914fd172bbda0 100644 (file)
--- a/yt_dlp/extractor/aenetworks.py
+++ b/yt_dlp/extractor/aenetworks.py
@@ -1,27 +1,24 @@
-# coding: utf-8
-from __future__ import unicode_literals
-
-import re
-
  from .theplatform import ThePlatformIE
  from ..utils import (
      ExtractorError,
      GeoRestrictedError,
      int_or_none,
+    remove_start,
+    traverse_obj,
      update_url_query,
      urlencode_postdata,
  )
  
  
-class AENetworksBaseIE(ThePlatformIE):
+class AENetworksBaseIE(ThePlatformIE):  # XXX: Do not subclass from concrete IE
      _BASE_URL_REGEX = r'''(?x)https?://
          (?:(?:www|play|watch)\.)?
          (?P<domain>
              (?:history(?:vault)?|aetv|mylifetime|lifetimemovieclub)\.com|
              fyi\.tv
          )/'''
-    _THEPLATFORM_KEY = 'crazyjava'
-    _THEPLATFORM_SECRET = 's3cr3t'
+    _THEPLATFORM_KEY = '43jXaGRQud'
+    _THEPLATFORM_SECRET = 'S10BPXHMlb'
      _DOMAIN_MAP = {
          'history.com': ('HISTORY', 'history'),
          'aetv.com': ('AETV', 'aetv'),
@@ -33,14 +30,17 @@ class AENetworksBaseIE(ThePlatformIE):
      }
  
      def _extract_aen_smil(self, smil_url, video_id, auth=None):
-        query = {'mbr': 'true'}
+        query = {
+            'mbr': 'true',
+            'formats': 'M3U+none,MPEG-DASH+none,MPEG4,MP3',
+        }
          if auth:
              query['auth'] = auth
          TP_SMIL_QUERY = [{
              'assetTypes': 'high_video_ak',
-            'switch': 'hls_high_ak'
+            'switch': 'hls_high_ak',
          }, {
-            'assetTypes': 'high_video_s3'
+            'assetTypes': 'high_video_s3',
          }, {
              'assetTypes': 'high_video_s3',
              'switch': 'hls_high_fastly',
@@ -64,7 +64,6 @@ def _extract_aen_smil(self, smil_url, video_id, auth=None):
              subtitles = self._merge_subtitles(subtitles, tp_subtitles)
          if last_e and not formats:
              raise last_e
-        self._sort_formats(formats)
          return {
              'id': video_id,
              'formats': formats,
@@ -75,7 +74,14 @@ def _extract_aetn_info(self, domain, filter_key, filter_value, url):
          requestor_id, brand = self._DOMAIN_MAP[domain]
          result = self._download_json(
              'https://feeds.video.aetnd.com/api/v2/%s/videos' % brand,
-            filter_value, query={'filter[%s]' % filter_key: filter_value})['results'][0]
+            filter_value, query={'filter[%s]' % filter_key: filter_value})
+        result = traverse_obj(
+            result, ('results',
+                     lambda k, v: k == 0 and v[filter_key] == filter_value),
+            get_all=False)
+        if not result:
+            raise ExtractorError('Show not found in A&E feed (too new?)', expected=True,
+                                 video_id=remove_start(filter_value, '/'))
          title = result['title']
          video_id = result['id']
          media_url = result['publicUrl']
@@ -87,7 +93,7 @@ def _extract_aetn_info(self, domain, filter_key, filter_value, url):
              resource = self._get_mvpd_resource(
                  requestor_id, theplatform_metadata['title'],
                  theplatform_metadata.get('AETN$PPL_pplProgramId') or theplatform_metadata.get('AETN$PPL_pplProgramId_OLD'),
-                theplatform_metadata['ratings'][0]['rating'])
+                traverse_obj(theplatform_metadata, ('ratings', 0, 'rating')))
              auth = self._extract_mvpd_auth(
                  url, video_id, requestor_id, resource)
          info.update(self._extract_aen_smil(media_url, video_id, auth))
@@ -115,18 +121,28 @@ class AENetworksIE(AENetworksBaseIE):
          'info_dict': {
              'id': '22253814',
              'ext': 'mp4',
-            'title': 'Winter is Coming',
-            'description': 'md5:641f424b7a19d8e24f26dea22cf59d74',
+            'title': 'Winter Is Coming',
+            'description': 'md5:a40e370925074260b1c8a633c632c63a',
              'timestamp': 1338306241,
              'upload_date': '20120529',
              'uploader': 'AENE-NEW',
+            'duration': 2592.0,
+            'thumbnail': r're:^https?://.*\.jpe?g$',
+            'chapters': 'count:5',
+            'tags': 'count:14',
+            'categories': ['Mountain Men'],
+            'episode_number': 1,
+            'episode': 'Episode 1',
+            'season': 'Season 1',
+            'season_number': 1,
+            'series': 'Mountain Men',
          },
          'params': {
              # m3u8 download
              'skip_download': True,
          },
          'add_ie': ['ThePlatform'],
-        'skip': 'This video is only available for users of participating TV providers.',
+        'skip': 'Geo-restricted - This content is not available in your location.'
      }, {
          'url': 'http://www.aetv.com/shows/duck-dynasty/season-9/episode-1',
          'info_dict': {
@@ -137,12 +153,22 @@ class AENetworksIE(AENetworksBaseIE):
              'timestamp': 1452634428,
              'upload_date': '20160112',
              'uploader': 'AENE-NEW',
+            'duration': 1277.695,
+            'thumbnail': r're:^https?://.*\.jpe?g$',
+            'chapters': 'count:4',
+            'tags': 'count:23',
+            'episode': 'Episode 1',
+            'episode_number': 1,
+            'season': 'Season 9',
+            'season_number': 9,
+            'series': 'Duck Dynasty',
          },
          'params': {
              # m3u8 download
              'skip_download': True,
          },
          'add_ie': ['ThePlatform'],
+        'skip': 'This video is only available for users of participating TV providers.',
      }, {
          'url': 'http://www.fyi.tv/shows/tiny-house-nation/season-1/episode-8',
          'only_matching': True
@@ -170,7 +196,7 @@ class AENetworksIE(AENetworksBaseIE):
      }]
  
      def _real_extract(self, url):
-        domain, canonical = re.match(self._VALID_URL, url).groups()
+        domain, canonical = self._match_valid_url(url).groups()
          return self._extract_aetn_info(domain, 'canonical', '/' + canonical, url)
  
  
@@ -187,7 +213,7 @@ def _call_api(self, resource, slug, brand, fields):
              }))['data'][resource]
  
      def _real_extract(self, url):
-        domain, slug = re.match(self._VALID_URL, url).groups()
+        domain, slug = self._match_valid_url(url).groups()
          _, brand = self._DOMAIN_MAP[domain]
          playlist = self._call_api(self._RESOURCE, slug, brand, self._FIELDS)
          base_url = 'http://watch.%s' % domain
@@ -309,7 +335,7 @@ class HistoryPlayerIE(AENetworksBaseIE):
      _TESTS = []
  
      def _real_extract(self, url):
-        domain, video_id = re.match(self._VALID_URL, url).groups()
+        domain, video_id = self._match_valid_url(url).groups()
          return self._extract_aetn_info(domain, 'id', video_id, url)
  
  
@@ -331,6 +357,7 @@ class BiographyIE(AENetworksBaseIE):
              'skip_download': True,
          },
          'add_ie': ['ThePlatform'],
+        'skip': '404 Not Found',
      }]
  
      def _real_extract(self, url):