mirror of
https://github.com/yt-dlp/yt-dlp.git
synced 2025-06-18 15:55:30 +02:00
77 lines
3.3 KiB
Python
77 lines
3.3 KiB
Python
from .common import InfoExtractor
|
|
from .youtube import YoutubeIE
|
|
from ..utils import (
|
|
clean_html,
|
|
parse_iso8601,
|
|
update_url,
|
|
url_or_none,
|
|
)
|
|
from ..utils.traversal import subs_list_to_dict, traverse_obj
|
|
|
|
|
|
class StarTrekIE(InfoExtractor):
|
|
IE_NAME = 'startrek'
|
|
IE_DESC = 'STAR TREK'
|
|
_VALID_URL = r'https?://(?:www\.)?startrek\.com(?:/en-(?:ca|un))?/videos/(?P<id>[^/?#]+)'
|
|
_TESTS = [{
|
|
'url': 'https://www.startrek.com/en-un/videos/official-trailer-star-trek-lower-decks-season-4',
|
|
'info_dict': {
|
|
'id': 'official-trailer-star-trek-lower-decks-season-4',
|
|
'ext': 'mp4',
|
|
'title': 'Official Trailer | Star Trek: Lower Decks - Season 4',
|
|
'alt_title': 'md5:dd7e3191aaaf9e95db16fc3abd5ef68b',
|
|
'categories': ['TRAILERS'],
|
|
'description': 'md5:563d7856ddab99bee7a5e50f45531757',
|
|
'release_date': '20230722',
|
|
'release_timestamp': 1690033200,
|
|
'series': 'Star Trek: Lower Decks',
|
|
'series_id': 'star-trek-lower-decks',
|
|
'thumbnail': r're:https?://.+\.(?:jpg|png)',
|
|
},
|
|
}, {
|
|
'url': 'https://www.startrek.com/en-ca/videos/my-first-contact-senator-cory-booker',
|
|
'info_dict': {
|
|
'id': 'my-first-contact-senator-cory-booker',
|
|
'ext': 'mp4',
|
|
'title': 'My First Contact: Senator Cory Booker',
|
|
'alt_title': 'md5:fe74a8bdb0afab421c6e159a7680db4d',
|
|
'categories': ['MY FIRST CONTACT'],
|
|
'description': 'md5:a3992ab3b3e0395925d71156bbc018ce',
|
|
'release_date': '20250401',
|
|
'release_timestamp': 1743512400,
|
|
'series': 'Star Trek: The Original Series',
|
|
'series_id': 'star-trek-the-original-series',
|
|
'thumbnail': r're:https?://.+\.(?:jpg|png)',
|
|
},
|
|
}]
|
|
|
|
def _real_extract(self, url):
|
|
video_id = self._match_id(url)
|
|
webpage = self._download_webpage(url, video_id)
|
|
|
|
page_props = self._search_nextjs_data(webpage, video_id)['props']['pageProps']
|
|
video_data = page_props['video']['data']
|
|
if youtube_id := video_data.get('youtube_video_id'):
|
|
return self.url_result(youtube_id, YoutubeIE)
|
|
|
|
series_id = traverse_obj(video_data, (
|
|
'series_and_movies', ..., 'series_or_movie', 'slug', {str}, any))
|
|
|
|
return {
|
|
'id': video_id,
|
|
'series': traverse_obj(page_props, (
|
|
'queried', 'header', 'tab3', 'slices', ..., 'items',
|
|
lambda _, v: v['link']['slug'] == series_id, 'link_copy', {str}, any)),
|
|
'series_id': series_id,
|
|
**traverse_obj(video_data, {
|
|
'title': ('title', ..., 'text', {clean_html}, any),
|
|
'alt_title': ('subhead', ..., 'text', {clean_html}, any),
|
|
'categories': ('category', 'data', 'category_name', {str.upper}, filter, all),
|
|
'description': ('slices', ..., 'primary', 'content', ..., 'text', {clean_html}, any),
|
|
'release_timestamp': ('published', {parse_iso8601}),
|
|
'subtitles': ({'url': 'legacy_subtitle_file'}, all, {subs_list_to_dict(lang='en')}),
|
|
'thumbnail': ('poster_frame', 'url', {url_or_none}, {update_url(query=None)}),
|
|
'url': ('legacy_video_url', {url_or_none}),
|
|
}),
|
|
}
|