[ie/matchtv] Fix extractor (#10190)

[yt-dlp.git] / yt_dlp / extractor / aenetworks.py
diff --git a/yt_dlp/extractor/aenetworks.py b/yt_dlp/extractor/aenetworks.py

index 8025de5a3289d8f9a4f051d39e283691f31098fb..8e257865fb37d1c0482b54b7e26fc70ab4921c11 100644 (file)
--- a/yt_dlp/extractor/aenetworks.py
+++ b/yt_dlp/extractor/aenetworks.py
@@ -1,18 +1,16 @@
-# coding: utf-8
-from __future__ import unicode_literals
-
-
  from .theplatform import ThePlatformIE
  from ..utils import (
      ExtractorError,
      GeoRestrictedError,
      int_or_none,
+    remove_start,
+    traverse_obj,
      update_url_query,
      urlencode_postdata,
  )
  
  
-class AENetworksBaseIE(ThePlatformIE):
+class AENetworksBaseIE(ThePlatformIE):  # XXX: Do not subclass from concrete IE
      _BASE_URL_REGEX = r'''(?x)https?://
          (?:(?:www|play|watch)\.)?
          (?P<domain>
@@ -32,14 +30,17 @@ class AENetworksBaseIE(ThePlatformIE):
      }
  
      def _extract_aen_smil(self, smil_url, video_id, auth=None):
-        query = {'mbr': 'true'}
+        query = {
+            'mbr': 'true',
+            'formats': 'M3U+none,MPEG-DASH+none,MPEG4,MP3',
+        }
          if auth:
              query['auth'] = auth
          TP_SMIL_QUERY = [{
              'assetTypes': 'high_video_ak',
-            'switch': 'hls_high_ak'
+            'switch': 'hls_high_ak',
          }, {
-            'assetTypes': 'high_video_s3'
+            'assetTypes': 'high_video_s3',
          }, {
              'assetTypes': 'high_video_s3',
              'switch': 'hls_high_fastly',
@@ -63,7 +64,6 @@ def _extract_aen_smil(self, smil_url, video_id, auth=None):
              subtitles = self._merge_subtitles(subtitles, tp_subtitles)
          if last_e and not formats:
              raise last_e
-        self._sort_formats(formats)
          return {
              'id': video_id,
              'formats': formats,
@@ -73,8 +73,15 @@ def _extract_aen_smil(self, smil_url, video_id, auth=None):
      def _extract_aetn_info(self, domain, filter_key, filter_value, url):
          requestor_id, brand = self._DOMAIN_MAP[domain]
          result = self._download_json(
-            'https://feeds.video.aetnd.com/api/v2/%s/videos' % brand,
-            filter_value, query={'filter[%s]' % filter_key: filter_value})['results'][0]
+            f'https://feeds.video.aetnd.com/api/v2/{brand}/videos',
+            filter_value, query={f'filter[{filter_key}]': filter_value})
+        result = traverse_obj(
+            result, ('results',
+                     lambda k, v: k == 0 and v[filter_key] == filter_value),
+            get_all=False)
+        if not result:
+            raise ExtractorError('Show not found in A&E feed (too new?)', expected=True,
+                                 video_id=remove_start(filter_value, '/'))
          title = result['title']
          video_id = result['id']
          media_url = result['publicUrl']
@@ -86,7 +93,7 @@ def _extract_aetn_info(self, domain, filter_key, filter_value, url):
              resource = self._get_mvpd_resource(
                  requestor_id, theplatform_metadata['title'],
                  theplatform_metadata.get('AETN$PPL_pplProgramId') or theplatform_metadata.get('AETN$PPL_pplProgramId_OLD'),
-                theplatform_metadata['ratings'][0]['rating'])
+                traverse_obj(theplatform_metadata, ('ratings', 0, 'rating')))
              auth = self._extract_mvpd_auth(
                  url, video_id, requestor_id, resource)
          info.update(self._extract_aen_smil(media_url, video_id, auth))
@@ -114,18 +121,28 @@ class AENetworksIE(AENetworksBaseIE):
          'info_dict': {
              'id': '22253814',
              'ext': 'mp4',
-            'title': 'Winter is Coming',
-            'description': 'md5:641f424b7a19d8e24f26dea22cf59d74',
+            'title': 'Winter Is Coming',
+            'description': 'md5:a40e370925074260b1c8a633c632c63a',
              'timestamp': 1338306241,
              'upload_date': '20120529',
              'uploader': 'AENE-NEW',
+            'duration': 2592.0,
+            'thumbnail': r're:^https?://.*\.jpe?g$',
+            'chapters': 'count:5',
+            'tags': 'count:14',
+            'categories': ['Mountain Men'],
+            'episode_number': 1,
+            'episode': 'Episode 1',
+            'season': 'Season 1',
+            'season_number': 1,
+            'series': 'Mountain Men',
          },
          'params': {
              # m3u8 download
              'skip_download': True,
          },
          'add_ie': ['ThePlatform'],
-        'skip': 'This video is only available for users of participating TV providers.',
+        'skip': 'Geo-restricted - This content is not available in your location.',
      }, {
          'url': 'http://www.aetv.com/shows/duck-dynasty/season-9/episode-1',
          'info_dict': {
@@ -136,36 +153,46 @@ class AENetworksIE(AENetworksBaseIE):
              'timestamp': 1452634428,
              'upload_date': '20160112',
              'uploader': 'AENE-NEW',
+            'duration': 1277.695,
+            'thumbnail': r're:^https?://.*\.jpe?g$',
+            'chapters': 'count:4',
+            'tags': 'count:23',
+            'episode': 'Episode 1',
+            'episode_number': 1,
+            'season': 'Season 9',
+            'season_number': 9,
+            'series': 'Duck Dynasty',
          },
          'params': {
              # m3u8 download
              'skip_download': True,
          },
          'add_ie': ['ThePlatform'],
+        'skip': 'This video is only available for users of participating TV providers.',
      }, {
          'url': 'http://www.fyi.tv/shows/tiny-house-nation/season-1/episode-8',
-        'only_matching': True
+        'only_matching': True,
      }, {
          'url': 'http://www.mylifetime.com/shows/project-runway-junior/season-1/episode-6',
-        'only_matching': True
+        'only_matching': True,
      }, {
          'url': 'http://www.mylifetime.com/movies/center-stage-on-pointe/full-movie',
-        'only_matching': True
+        'only_matching': True,
      }, {
          'url': 'https://watch.lifetimemovieclub.com/movies/10-year-reunion/full-movie',
-        'only_matching': True
+        'only_matching': True,
      }, {
          'url': 'http://www.history.com/specials/sniper-into-the-kill-zone/full-special',
-        'only_matching': True
+        'only_matching': True,
      }, {
          'url': 'https://www.aetv.com/specials/hunting-jonbenets-killer-the-untold-story/preview-hunting-jonbenets-killer-the-untold-story',
-        'only_matching': True
+        'only_matching': True,
      }, {
          'url': 'http://www.history.com/videos/history-of-valentines-day',
-        'only_matching': True
+        'only_matching': True,
      }, {
          'url': 'https://play.aetv.com/shows/duck-dynasty/videos/best-of-duck-dynasty-getting-quack-in-shape',
-        'only_matching': True
+        'only_matching': True,
      }]
  
      def _real_extract(self, url):
@@ -182,14 +209,14 @@ def _call_api(self, resource, slug, brand, fields):
    %s(slug: "%s") {
      %s
    }
-}''' % (resource, slug, fields),
+}''' % (resource, slug, fields),  # noqa: UP031
              }))['data'][resource]
  
      def _real_extract(self, url):
          domain, slug = self._match_valid_url(url).groups()
          _, brand = self._DOMAIN_MAP[domain]
          playlist = self._call_api(self._RESOURCE, slug, brand, self._FIELDS)
-        base_url = 'http://watch.%s' % domain
+        base_url = f'http://watch.{domain}'
  
          entries = []
          for item in (playlist.get(self._ITEMS_KEY) or []):
@@ -221,10 +248,10 @@ class AENetworksCollectionIE(AENetworksListBaseIE):
          'playlist_mincount': 12,
      }, {
          'url': 'https://watch.historyvault.com/shows/america-the-story-of-us-2/season-1/list/america-the-story-of-us',
-        'only_matching': True
+        'only_matching': True,
      }, {
          'url': 'https://www.historyvault.com/collections/mysteryquest',
-        'only_matching': True
+        'only_matching': True,
      }]
      _RESOURCE = 'list'
      _ITEMS_KEY = 'items'
@@ -282,7 +309,7 @@ class HistoryTopicIE(AENetworksBaseIE):
          'info_dict': {
              'id': '40700995724',
              'ext': 'mp4',
-            'title': "History of Valentine’s Day",
+            'title': 'History of Valentine’s Day',
              'description': 'md5:7b57ea4829b391995b405fa60bd7b5f7',
              'timestamp': 1375819729,
              'upload_date': '20130806',
@@ -330,12 +357,13 @@ class BiographyIE(AENetworksBaseIE):
              'skip_download': True,
          },
          'add_ie': ['ThePlatform'],
+        'skip': '404 Not Found',
      }]
  
      def _real_extract(self, url):
          display_id = self._match_id(url)
          webpage = self._download_webpage(url, display_id)
          player_url = self._search_regex(
-            r'<phoenix-iframe[^>]+src="(%s)' % HistoryPlayerIE._VALID_URL,
+            rf'<phoenix-iframe[^>]+src="({HistoryPlayerIE._VALID_URL})',
              webpage, 'player URL')
          return self.url_result(player_url, HistoryPlayerIE.ie_key())