mirror of
				https://github.com/yt-dlp/yt-dlp.git
				synced 2025-11-04 00:25:15 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			77 lines
		
	
	
		
			3.3 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			77 lines
		
	
	
		
			3.3 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
from .common import InfoExtractor
 | 
						|
from .youtube import YoutubeIE
 | 
						|
from ..utils import (
 | 
						|
    clean_html,
 | 
						|
    parse_iso8601,
 | 
						|
    update_url,
 | 
						|
    url_or_none,
 | 
						|
)
 | 
						|
from ..utils.traversal import subs_list_to_dict, traverse_obj
 | 
						|
 | 
						|
 | 
						|
class StarTrekIE(InfoExtractor):
    # Handles startrek.com video pages; the URL slug after /videos/ is used as the video id.
    IE_NAME = 'startrek'
    IE_DESC = 'STAR TREK'
    # The locale prefix (/en-ca or /en-un) is optional.
    _VALID_URL = r'https?://(?:www\.)?startrek\.com(?:/en-(?:ca|un))?/videos/(?P<id>[^/?#]+)'
    _TESTS = [{
        'url': 'https://www.startrek.com/en-un/videos/official-trailer-star-trek-lower-decks-season-4',
        'info_dict': {
            'id': 'official-trailer-star-trek-lower-decks-season-4',
            'ext': 'mp4',
            'title': 'Official Trailer | Star Trek: Lower Decks - Season 4',
            'alt_title': 'md5:dd7e3191aaaf9e95db16fc3abd5ef68b',
            'categories': ['TRAILERS'],
            'description': 'md5:563d7856ddab99bee7a5e50f45531757',
            'release_date': '20230722',
            'release_timestamp': 1690033200,
            'series': 'Star Trek: Lower Decks',
            'series_id': 'star-trek-lower-decks',
            'thumbnail': r're:https?://.+\.(?:jpg|png)',
        },
    }, {
        'url': 'https://www.startrek.com/en-ca/videos/my-first-contact-senator-cory-booker',
        'info_dict': {
            'id': 'my-first-contact-senator-cory-booker',
            'ext': 'mp4',
            'title': 'My First Contact: Senator Cory Booker',
            'alt_title': 'md5:fe74a8bdb0afab421c6e159a7680db4d',
            'categories': ['MY FIRST CONTACT'],
            'description': 'md5:a3992ab3b3e0395925d71156bbc018ce',
            'release_date': '20250401',
            'release_timestamp': 1743512400,
            'series': 'Star Trek: The Original Series',
            'series_id': 'star-trek-the-original-series',
            'thumbnail': r're:https?://.+\.(?:jpg|png)',
        },
    }]

    def _real_extract(self, url):
        # Fetch the page and read the 'pageProps' object out of the data
        # returned by _search_nextjs_data; 'video' -> 'data' is indexed
        # directly, so a page without it raises instead of yielding an
        # empty result.
        slug = self._match_id(url)
        nextjs_data = self._search_nextjs_data(
            self._download_webpage(url, slug), slug)
        props = nextjs_data['props']['pageProps']
        video = props['video']['data']

        # When the entry carries a YouTube id, hand the whole extraction
        # over to the YouTube extractor.
        yt_id = video.get('youtube_video_id')
        if yt_id:
            return self.url_result(yt_id, YoutubeIE)

        # Slug of the series/movie this video is attached to (may be None).
        series_slug = traverse_obj(video, (
            'series_and_movies', ..., 'series_or_movie', 'slug', {str}, any))

        # The display name of the series is not read from the video entry;
        # it is looked up among the header ('tab3') items by matching the
        # linked slug against series_slug.
        series_title = traverse_obj(props, (
            'queried', 'header', 'tab3', 'slices', ..., 'items',
            lambda _, item: item['link']['slug'] == series_slug,
            'link_copy', {str}, any))

        # Remaining fields all come straight from the video entry.
        metadata = traverse_obj(video, {
            'title': ('title', ..., 'text', {clean_html}, any),
            'alt_title': ('subhead', ..., 'text', {clean_html}, any),
            'categories': ('category', 'data', 'category_name', {str.upper}, filter, all),
            'description': ('slices', ..., 'primary', 'content', ..., 'text', {clean_html}, any),
            'release_timestamp': ('published', {parse_iso8601}),
            'subtitles': ({'url': 'legacy_subtitle_file'}, all, {subs_list_to_dict(lang='en')}),
            # update_url(query=None): drop the query string from the poster URL
            'thumbnail': ('poster_frame', 'url', {url_or_none}, {update_url(query=None)}),
            'url': ('legacy_video_url', {url_or_none}),
        })

        info = {
            'id': slug,
            'series': series_title,
            'series_id': series_slug,
        }
        info.update(metadata)
        return info
 |