Skip to content

Commit

Permalink
[ie/MLBArticle] Fix extractor (#9021)
Browse files Browse the repository at this point in the history
Closes #8682
Authored by: HobbyistDev
  • Loading branch information
HobbyistDev authored Jan 19, 2024
1 parent 4310b66 commit 50e06e2
Showing 1 changed file with 8 additions and 10 deletions.
18 changes: 8 additions & 10 deletions yt_dlp/extractor/mlb.py
Original file line number Diff line number Diff line change
Expand Up @@ -355,27 +355,25 @@ class MLBArticleIE(InfoExtractor):
'info_dict': {
'id': '36db7394-343c-4ea3-b8ca-ead2e61bca9a',
'title': 'Machado\'s grab draws hilarious irate reaction',
'modified_timestamp': 1650130737,
'modified_timestamp': 1675888370,
'description': 'md5:a19d4eb0487b2cb304e9a176f6b67676',
'modified_date': '20220416',
'modified_date': '20230208',
},
'playlist_count': 2,
'playlist_mincount': 2,
}]

def _real_extract(self, url):
display_id = self._match_id(url)
webpage = self._download_webpage(url, display_id)
apollo_cache_json = self._search_json(r'window\.initState\s*=', webpage, 'window.initState', display_id)['apolloCache']

content_data_id = traverse_obj(
apollo_cache_json, ('ROOT_QUERY', lambda k, _: k.startswith('getForgeContent'), 'id'), get_all=False)

content_real_info = apollo_cache_json[content_data_id]
content_real_info = traverse_obj(
apollo_cache_json, ('ROOT_QUERY', lambda k, _: k.startswith('getArticle')), get_all=False)

return self.playlist_from_matches(
traverse_obj(content_real_info, ('parts', lambda _, v: v['typename'] == 'Video', 'id')),
getter=lambda x: f'https://www.mlb.com/video/{apollo_cache_json[x]["slug"]}',
ie=MLBVideoIE, playlist_id=content_real_info.get('_translationId'),
traverse_obj(content_real_info, ('parts', lambda _, v: v['__typename'] == 'Video' or v['type'] == 'video')),
getter=lambda x: f'https://www.mlb.com/video/{x["slug"]}',
ie=MLBVideoIE, playlist_id=content_real_info.get('translationId'),
title=self._html_search_meta('og:title', webpage),
description=content_real_info.get('summary'),
modified_timestamp=parse_iso8601(content_real_info.get('lastUpdatedDate')))

0 comments on commit 50e06e2

Please sign in to comment.