[ie/MLBArticle] Fix extractor (#9021)

author HobbyistDev <redacted>

Fri, 19 Jan 2024 20:31:06 +0000 (05:31 +0900)

committer GitHub <redacted>

Fri, 19 Jan 2024 20:31:06 +0000 (20:31 +0000)
author HobbyistDev <redacted>
Fri, 19 Jan 2024 20:31:06 +0000 (05:31 +0900)
committer GitHub <redacted>
Fri, 19 Jan 2024 20:31:06 +0000 (20:31 +0000)
diff --git a/yt_dlp/extractor/mlb.py b/yt_dlp/extractor/mlb.py

index 72057dc97a0be14fdef0ffd6d104c00dfcfbec8e..d715b978920bb3c67bea8ab65f202da4f445e569 100644 (file)
--- a/yt_dlp/extractor/mlb.py
+++ b/yt_dlp/extractor/mlb.py
@@ -355,11 +355,11 @@ class MLBArticleIE(InfoExtractor):
          'info_dict': {
              'id': '36db7394-343c-4ea3-b8ca-ead2e61bca9a',
              'title': 'Machado\'s grab draws hilarious irate reaction',
-            'modified_timestamp': 1650130737,
+            'modified_timestamp': 1675888370,
              'description': 'md5:a19d4eb0487b2cb304e9a176f6b67676',
-            'modified_date': '20220416',
+            'modified_date': '20230208',
          },
-        'playlist_count': 2,
+        'playlist_mincount': 2,
      }]
  
      def _real_extract(self, url):
@@ -367,15 +367,13 @@ def _real_extract(self, url):
          webpage = self._download_webpage(url, display_id)
          apollo_cache_json = self._search_json(r'window\.initState\s*=', webpage, 'window.initState', display_id)['apolloCache']
  
-        content_data_id = traverse_obj(
-            apollo_cache_json, ('ROOT_QUERY', lambda k, _: k.startswith('getForgeContent'), 'id'), get_all=False)
-
-        content_real_info = apollo_cache_json[content_data_id]
+        content_real_info = traverse_obj(
+            apollo_cache_json, ('ROOT_QUERY', lambda k, _: k.startswith('getArticle')), get_all=False)
  
          return self.playlist_from_matches(
-            traverse_obj(content_real_info, ('parts', lambda _, v: v['typename'] == 'Video', 'id')),
-            getter=lambda x: f'https://www.mlb.com/video/{apollo_cache_json[x]["slug"]}',
-            ie=MLBVideoIE, playlist_id=content_real_info.get('_translationId'),
+            traverse_obj(content_real_info, ('parts', lambda _, v: v['__typename'] == 'Video' or v['type'] == 'video')),
+            getter=lambda x: f'https://www.mlb.com/video/{x["slug"]}',
+            ie=MLBVideoIE, playlist_id=content_real_info.get('translationId'),
              title=self._html_search_meta('og:title', webpage),
              description=content_real_info.get('summary'),
              modified_timestamp=parse_iso8601(content_real_info.get('lastUpdatedDate')))
author	HobbyistDev <redacted>
	Fri, 19 Jan 2024 20:31:06 +0000 (05:31 +0900)
committer	GitHub <redacted>
	Fri, 19 Jan 2024 20:31:06 +0000 (20:31 +0000)