mirror of
				https://github.com/yt-dlp/yt-dlp.git
				synced 2025-11-03 16:15:14 +00:00 
			
		
		
		
	Closes #1770, Closes #8073 Authored by: maxbin123, bashonly Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
		
			
				
	
	
		
			306 lines
		
	
	
		
			15 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			306 lines
		
	
	
		
			15 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
import re
 | 
						||
 | 
						||
from .adobepass import AdobePassIE
 | 
						||
from ..utils import (
 | 
						||
    ExtractorError,
 | 
						||
    determine_ext,
 | 
						||
    int_or_none,
 | 
						||
    join_nonempty,
 | 
						||
    parse_age_limit,
 | 
						||
    unified_timestamp,
 | 
						||
    urlencode_postdata,
 | 
						||
)
 | 
						||
from ..utils.traversal import traverse_obj
 | 
						||
 | 
						||
 | 
						||
class GoIE(AdobePassIE):
 | 
						||
    _SITE_INFO = {
 | 
						||
        'abc': {
 | 
						||
            'brand': '001',
 | 
						||
            'requestor_id': 'dtci',
 | 
						||
            'provider_id': 'ABC',
 | 
						||
            'software_statement': 'eyJhbGciOiJSUzI1NiJ9.eyJzdWIiOiI4OTcwMjlkYS0yYjM1LTQyOWUtYWQ0NS02ZjZiZjVkZTdhOTUiLCJuYmYiOjE2MjAxNzM5NjksImlzcyI6ImF1dGguYWRvYmUuY29tIiwiaWF0IjoxNjIwMTczOTY5fQ.SC69DVJWSL8sIe-vVUrP6xS_kzHKqwz9PdKYexs_y-f7Vin6mM-7S-W1TE_-K55O0pyf-TL4xYgvm6LIye8CckG-nZfVwNPV4huduov0jmIcxCQFeUwkHULG2IaA44wfBVUBdaHgkhPweZ2amjycO_IXtez-gBXOLbE3B7Gx9j_5ISCFtyVUblThKfoGyQv6KT6t8Vpmc4ZSKCCQp74KWFFypydb9ucego1taW_nQD06Cdf4yByLd6NaTBceMcIKbug9b9gxFm3XBgJ5q3z7KGo1Kr6XalAV5j4m-fQ91wczlTilX8FM4AljMupyRM9mA_aEADILQ4hS79q4SM0w6w',
 | 
						||
        },
 | 
						||
        'freeform': {
 | 
						||
            'brand': '002',
 | 
						||
            'requestor_id': 'ABCFamily',
 | 
						||
            'provider_id': 'ABCFamily',
 | 
						||
            'software_statement': 'eyJhbGciOiJSUzI1NiJ9.eyJzdWIiOiJhZWM2MGYyNC0xYzRjLTQ1NzQtYjc0Zi03ZmM4N2E5YWMzMzgiLCJuYmYiOjE1ODc2NjU5MjMsImlzcyI6ImF1dGguYWRvYmUuY29tIiwiaWF0IjoxNTg3NjY1OTIzfQ.flCn3dhvmvPnWmV0JV8Fm0YFyj07yPez9-n1GFEwVIm_S2wQVWbWyJhqsAyLZVFrhOMZYTqmPS3OHxGwTwXkEYn6PD7o_vIVG3oqi-Xn1m5jRt_Gazw5qEtpat6VE7bvKGSD3ZhcidOrsCk8NcYyq75u61NHDvSl81pcedJjVRVUpsqrEwmo0aVbA0C8PX3ri0mEbGvkMKvHn8E60xp-PSE-VK8SDT0plwPu_TwUszkZ6-_I8_2xcv_WBqcXFkAVg7Q-iNJXgQvmNsrpcrYuLvi6hEH4ZLtoDcXU6MhwTQAJTiHSo8x9aHX1_qFP09CzlNOFQbC2ZEJdP9SvA53SLQ',
 | 
						||
        },
 | 
						||
        'disneynow': {
 | 
						||
            'brand': '011',  # also: '004', '008', '009'
 | 
						||
            'requestor_id': 'DisneyChannels',
 | 
						||
            'provider_id': 'DisneyChannels',
 | 
						||
            'software_statement': 'eyJhbGciOiJSUzI1NiJ9.eyJzdWIiOiI1MzAzNTRiOS04NDNiLTRkNjAtYTQ3ZS0yNzk1MzlkOTIyNTciLCJuYmYiOjE1NTg5ODc0NDksImlzcyI6ImF1dGguYWRvYmUuY29tIiwiaWF0IjoxNTU4OTg3NDQ5fQ.Jud6YS6-J2h0h6po0oMheDym0qRTJQGj4kzacrz4DFuEwhcBkkykW6pF5pKuAUJy9HCZ40oDAHe2KcTlDJjCZF5tDaUEfdihakZ9cC_rG7MU-QoRne8qaB_dPDKwGuk-ZyWD8eV3zwTJmbGo8hDxYTEU81YNCxwhyc_BPDr5TYiubbmpP3_pTnXmSpuL58isJ2peSKWlX9BacuXtBY25c_QnPFKk-_EETm7IHkTpDazde1QfHWGu4s4yJpKGk8RVVujVG6h6ELlL-ZeYLilBm7iS7h1TYG1u7fJhyZRL7isaom6NvAzsvN3ngss1fLwt8decP8wzdFHrbYTdTjW8qw',
 | 
						||
            'resource_id': 'Disney',
 | 
						||
        },
 | 
						||
        'fxnetworks': {
 | 
						||
            'brand': '025',  # also: '020'
 | 
						||
            'requestor_id': 'dtci',
 | 
						||
            'provider_id': 'fx',  # also 'fxx', 'fxm'
 | 
						||
            'software_statement': 'eyJhbGciOiJSUzI1NiJ9.eyJzdWIiOiIzYWRhYWZiNC02OTAxLTRlYzktOTdmNy1lYWZkZTJkODJkN2EiLCJuYmYiOjE1NjIwMjQwNzYsImlzcyI6ImF1dGguYWRvYmUuY29tIiwiaWF0IjoxNTYyMDI0MDc2fQ.dhKMpZK50AObbZYrMiYPSfWtzXHUaeMP3jrIY4Cgfvh0GaEgk0Mns_zp78jypFeZgRtPVleQMQDNq2YEloRLcAGqP1aa6WVDglnK77ZWUm4IKai14Rwf3A6YBhSRoO2_lMmUGkuTf6gZY-kMIPqBYKqzTQiQl4HbniPFodIzFRiuI9QJVrkoyTGrJL4oqiX08PoFI3Z-TOti1Heu3EbFC-GveQHhlinYrzU7rbiAqLEz7FImtfBDsnXX1Y3uJDLYM3Bq4Oh0nrzTv1Fd62wNsCNErHHIbELidh1zZF0ujvt7ReuZUwAitm0UhEJ7OxNOUbEQWtae6pVNscvdvTFMpg',
 | 
						||
        },
 | 
						||
        'nationalgeographic': {
 | 
						||
            'brand': '026',  # also '023'
 | 
						||
            'requestor_id': 'dtci',
 | 
						||
            'provider_id': 'ngc',  # also 'ngw'
 | 
						||
            'software_statement': 'eyJhbGciOiJSUzI1NiJ9.eyJzdWIiOiIxMzE4YTM1Ni05Mjc4LTQ4NjEtYTFmNi1jMTIzMzg1ZWMzYzMiLCJuYmYiOjE1NjIwMjM4MjgsImlzcyI6ImF1dGguYWRvYmUuY29tIiwiaWF0IjoxNTYyMDIzODI4fQ.Le-2OzF9-jrhJ7ZfWtLWk5iSHGVZoxeU1w0_fO--Heli0OwRZsRq2slSmx-oZTzxuWmAgDEiBkWSDcDK6sM25DrCLsdsJa3MBuZ-slBRtH8aq3HpNoqqLkU-vg6gRUEKMtwBUtwCu_9aKUCayYtndWv4b1DjVQeSrteOW5NNudWVYleAe0kxeNJQHo5If9SCzDudKVJktFUjhNks4QPOC_uONPkRRlL9D0fNvtOY-LRFckfcHhf5z9l1iZjeukV0YhdKnuw1wyiaWrQXBUDiBfbkCRd2DM-KnelqPxfiXCaTjGKDURRBO3pz33ebge3IFXSiU5vl4qHQ8xvunzGpFw',
 | 
						||
        },
 | 
						||
    }
 | 
						||
    _URL_PATH_RE = r'(?:video|episode|movies-and-specials)/(?P<id>[\da-f]{8}-(?:[\da-f]{4}-){3}[\da-f]{12})'
 | 
						||
    _VALID_URL = [
 | 
						||
        fr'https?://(?:www\.)?(?P<site>abc)\.com/{_URL_PATH_RE}',
 | 
						||
        fr'https?://(?:www\.)?(?P<site>freeform)\.com/{_URL_PATH_RE}',
 | 
						||
        fr'https?://(?:www\.)?(?P<site>disneynow)\.com/{_URL_PATH_RE}',
 | 
						||
        fr'https?://fxnow\.(?P<site>fxnetworks)\.com/{_URL_PATH_RE}',
 | 
						||
        fr'https?://(?:www\.)?(?P<site>nationalgeographic)\.com/tv/{_URL_PATH_RE}',
 | 
						||
    ]
 | 
						||
    _TESTS = [{
 | 
						||
        'url': 'https://abc.com/episode/4192c0e6-26e5-47a8-817b-ce8272b9e440/playlist/PL551127435',
 | 
						||
        'info_dict': {
 | 
						||
            'id': 'VDKA10805898',
 | 
						||
            'ext': 'mp4',
 | 
						||
            'title': 'Switch the Flip',
 | 
						||
            'description': 'To help get Brian’s life in order, Stewie and Brian swap bodies using a machine that Stewie invents.',
 | 
						||
            'age_limit': 14,
 | 
						||
            'duration': 1297,
 | 
						||
            'thumbnail': r're:https?://.+/.+\.jpg',
 | 
						||
            'series': 'Family Guy',
 | 
						||
            'season': 'Season 16',
 | 
						||
            'season_number': 16,
 | 
						||
            'episode': 'Episode 17',
 | 
						||
            'episode_number': 17,
 | 
						||
            'timestamp': 1746082800.0,
 | 
						||
            'upload_date': '20250501',
 | 
						||
        },
 | 
						||
        'params': {'skip_download': 'm3u8'},
 | 
						||
        'skip': 'This video requires AdobePass MSO credentials',
 | 
						||
    }, {
 | 
						||
        'url': 'https://disneynow.com/episode/21029660-ba06-4406-adb0-a9a78f6e265e/playlist/PL553044961',
 | 
						||
        'info_dict': {
 | 
						||
            'id': 'VDKA39546942',
 | 
						||
            'ext': 'mp4',
 | 
						||
            'title': 'Zero Friends Again',
 | 
						||
            'description': 'Relationships fray under the pressures of a difficult journey.',
 | 
						||
            'age_limit': 0,
 | 
						||
            'duration': 1721,
 | 
						||
            'thumbnail': r're:https?://.+/.+\.jpg',
 | 
						||
            'series': 'Star Wars: Skeleton Crew',
 | 
						||
            'season': 'Season 1',
 | 
						||
            'season_number': 1,
 | 
						||
            'episode': 'Episode 6',
 | 
						||
            'episode_number': 6,
 | 
						||
            'timestamp': 1746946800.0,
 | 
						||
            'upload_date': '20250511',
 | 
						||
        },
 | 
						||
        'params': {'skip_download': 'm3u8'},
 | 
						||
        'skip': 'This video requires AdobePass MSO credentials',
 | 
						||
    }, {
 | 
						||
        'url': 'https://fxnow.fxnetworks.com/episode/09f4fa6f-c293-469e-aebe-32c9ca5842a7/playlist/PL554408064',
 | 
						||
        'info_dict': {
 | 
						||
            'id': 'VDKA38112033',
 | 
						||
            'ext': 'mp4',
 | 
						||
            'title': 'The Return of Jerry',
 | 
						||
            'description': 'The vampires’ long-lost fifth roommate returns. Written by Paul Simms; directed by Kyle Newacheck.',
 | 
						||
            'age_limit': 17,
 | 
						||
            'duration': 1493,
 | 
						||
            'thumbnail': r're:https?://.+/.+\.jpg',
 | 
						||
            'series': 'What We Do in the Shadows',
 | 
						||
            'season': 'Season 6',
 | 
						||
            'season_number': 6,
 | 
						||
            'episode': 'Episode 1',
 | 
						||
            'episode_number': 1,
 | 
						||
            'timestamp': 1729573200.0,
 | 
						||
            'upload_date': '20241022',
 | 
						||
        },
 | 
						||
        'params': {'skip_download': 'm3u8'},
 | 
						||
        'skip': 'This video requires AdobePass MSO credentials',
 | 
						||
    }, {
 | 
						||
        'url': 'https://www.freeform.com/episode/bda0eaf7-761a-4838-aa44-96f794000844/playlist/PL553044961',
 | 
						||
        'info_dict': {
 | 
						||
            'id': 'VDKA39007340',
 | 
						||
            'ext': 'mp4',
 | 
						||
            'title': 'Angel\'s Landing',
 | 
						||
            'description': 'md5:91bf084e785c968fab16734df7313446',
 | 
						||
            'age_limit': 14,
 | 
						||
            'duration': 2523,
 | 
						||
            'thumbnail': r're:https?://.+/.+\.jpg',
 | 
						||
            'series': 'How I Escaped My Cult',
 | 
						||
            'season': 'Season 1',
 | 
						||
            'season_number': 1,
 | 
						||
            'episode': 'Episode 2',
 | 
						||
            'episode_number': 2,
 | 
						||
            'timestamp': 1740038400.0,
 | 
						||
            'upload_date': '20250220',
 | 
						||
        },
 | 
						||
        'params': {'skip_download': 'm3u8'},
 | 
						||
    }, {
 | 
						||
        'url': 'https://www.nationalgeographic.com/tv/episode/ca694661-1186-41ae-8089-82f64d69b16d/playlist/PL554408064',
 | 
						||
        'info_dict': {
 | 
						||
            'id': 'VDKA39492078',
 | 
						||
            'ext': 'mp4',
 | 
						||
            'title': 'Heart of the Emperors',
 | 
						||
            'description': 'md5:4fc50a2878f030bb3a7eac9124dca677',
 | 
						||
            'age_limit': 0,
 | 
						||
            'duration': 2775,
 | 
						||
            'thumbnail': r're:https?://.+/.+\.jpg',
 | 
						||
            'series': 'Secrets of the Penguins',
 | 
						||
            'season': 'Season 1',
 | 
						||
            'season_number': 1,
 | 
						||
            'episode': 'Episode 1',
 | 
						||
            'episode_number': 1,
 | 
						||
            'timestamp': 1745204400.0,
 | 
						||
            'upload_date': '20250421',
 | 
						||
        },
 | 
						||
        'params': {'skip_download': 'm3u8'},
 | 
						||
    }, {
 | 
						||
        'url': 'https://www.freeform.com/movies-and-specials/c38281fc-9f8f-47c7-8220-22394f9df2e1',
 | 
						||
        'only_matching': True,
 | 
						||
    }, {
 | 
						||
        'url': 'https://abc.com/video/219a454a-172c-41bf-878a-d169e6bc0bdc/playlist/PL5523098420',
 | 
						||
        'only_matching': True,
 | 
						||
    }]
 | 
						||
 | 
						||
    def _extract_videos(self, brand, video_id='-1', show_id='-1'):
 | 
						||
        display_id = video_id if video_id != '-1' else show_id
 | 
						||
        return self._download_json(
 | 
						||
            f'http://api.contents.watchabc.go.com/vp2/ws/contents/3000/videos/{brand}/001/-1/{show_id}/-1/{video_id}/-1/-1.json',
 | 
						||
            display_id)['video']
 | 
						||
 | 
						||
    def _extract_global_var(self, name, webpage, video_id):
 | 
						||
        return self._search_json(
 | 
						||
            fr'window\[["\']{re.escape(name)}["\']\]\s*=',
 | 
						||
            webpage, f'{name.strip("_")} JSON', video_id)
 | 
						||
 | 
						||
    def _real_extract(self, url):
 | 
						||
        site, display_id = self._match_valid_url(url).group('site', 'id')
 | 
						||
        webpage = self._download_webpage(url, display_id)
 | 
						||
        config = self._extract_global_var('__CONFIG__', webpage, display_id)
 | 
						||
        data = self._extract_global_var(config['globalVar'], webpage, display_id)
 | 
						||
        video_id = traverse_obj(data, (
 | 
						||
            'page', 'content', 'video', 'layout', (('video', 'id'), 'videoid'), {str}, any))
 | 
						||
        if not video_id:
 | 
						||
            video_id = self._search_regex([
 | 
						||
                # data-track-video_id="VDKA39492078"
 | 
						||
                # data-track-video_id_code="vdka39492078"
 | 
						||
                # data-video-id="'VDKA3609139'"
 | 
						||
                r'data-(?:track-)?video[_-]id(?:_code)?=["\']*((?:vdka|VDKA)\d+)',
 | 
						||
                # page.analytics.videoIdCode
 | 
						||
                r'\bvideoIdCode["\']\s*:\s*["\']((?:vdka|VDKA)\d+)'], webpage, 'video ID')
 | 
						||
 | 
						||
        site_info = self._SITE_INFO[site]
 | 
						||
        brand = site_info['brand']
 | 
						||
        video_data = self._extract_videos(brand, video_id)[0]
 | 
						||
        video_id = video_data['id']
 | 
						||
        title = video_data['title']
 | 
						||
 | 
						||
        formats = []
 | 
						||
        subtitles = {}
 | 
						||
        for asset in video_data.get('assets', {}).get('asset', []):
 | 
						||
            asset_url = asset.get('value')
 | 
						||
            if not asset_url:
 | 
						||
                continue
 | 
						||
            format_id = asset.get('format')
 | 
						||
            ext = determine_ext(asset_url)
 | 
						||
            if ext == 'm3u8':
 | 
						||
                video_type = video_data.get('type')
 | 
						||
                data = {
 | 
						||
                    'video_id': video_id,
 | 
						||
                    'video_type': video_type,
 | 
						||
                    'brand': brand,
 | 
						||
                    'device': '001',
 | 
						||
                    'app_name': 'webplayer-abc',
 | 
						||
                }
 | 
						||
                if video_data.get('accesslevel') == '1':
 | 
						||
                    provider_id = site_info['provider_id']
 | 
						||
                    software_statement = traverse_obj(data, ('app', 'config', (
 | 
						||
                        ('features', 'auth', 'softwareStatement'),
 | 
						||
                        ('tvAuth', 'SOFTWARE_STATEMENTS', 'PRODUCTION'),
 | 
						||
                    ), {str}, any)) or site_info['software_statement']
 | 
						||
                    resource = site_info.get('resource_id') or self._get_mvpd_resource(
 | 
						||
                        provider_id, title, video_id, None)
 | 
						||
                    auth = self._extract_mvpd_auth(
 | 
						||
                        url, video_id, site_info['requestor_id'], resource, software_statement)
 | 
						||
                    data.update({
 | 
						||
                        'token': auth,
 | 
						||
                        'token_type': 'ap',
 | 
						||
                        'adobe_requestor_id': provider_id,
 | 
						||
                    })
 | 
						||
                else:
 | 
						||
                    self._initialize_geo_bypass({'countries': ['US']})
 | 
						||
                entitlement = self._download_json(
 | 
						||
                    'https://prod.gatekeeper.us-abc.symphony.edgedatg.go.com/vp2/ws-secure/entitlement/2020/playmanifest_secure.json',
 | 
						||
                    video_id, data=urlencode_postdata(data))
 | 
						||
                errors = entitlement.get('errors', {}).get('errors', [])
 | 
						||
                if errors:
 | 
						||
                    for error in errors:
 | 
						||
                        if error.get('code') == 1002:
 | 
						||
                            self.raise_geo_restricted(
 | 
						||
                                error['message'], countries=['US'])
 | 
						||
                    error_message = ', '.join([error['message'] for error in errors])
 | 
						||
                    raise ExtractorError(f'{self.IE_NAME} said: {error_message}', expected=True)
 | 
						||
                asset_url += '?' + entitlement['entitlement']['uplynkData']['sessionKey']
 | 
						||
                fmts, subs = self._extract_m3u8_formats_and_subtitles(
 | 
						||
                    asset_url, video_id, 'mp4', m3u8_id=format_id or 'hls', fatal=False)
 | 
						||
                formats.extend(fmts)
 | 
						||
                self._merge_subtitles(subs, target=subtitles)
 | 
						||
            else:
 | 
						||
                f = {
 | 
						||
                    'format_id': format_id,
 | 
						||
                    'url': asset_url,
 | 
						||
                    'ext': ext,
 | 
						||
                }
 | 
						||
                if re.search(r'(?:/mp4/source/|_source\.mp4)', asset_url):
 | 
						||
                    f.update({
 | 
						||
                        'format_id': (f'{format_id}-' if format_id else '') + 'SOURCE',
 | 
						||
                        'quality': 1,
 | 
						||
                    })
 | 
						||
                else:
 | 
						||
                    mobj = re.search(r'/(\d+)x(\d+)/', asset_url)
 | 
						||
                    if mobj:
 | 
						||
                        height = int(mobj.group(2))
 | 
						||
                        f.update({
 | 
						||
                            'format_id': join_nonempty(format_id, f'{height}P'),
 | 
						||
                            'width': int(mobj.group(1)),
 | 
						||
                            'height': height,
 | 
						||
                        })
 | 
						||
                formats.append(f)
 | 
						||
 | 
						||
        for cc in video_data.get('closedcaption', {}).get('src', []):
 | 
						||
            cc_url = cc.get('value')
 | 
						||
            if not cc_url:
 | 
						||
                continue
 | 
						||
            ext = determine_ext(cc_url)
 | 
						||
            if ext == 'xml':
 | 
						||
                ext = 'ttml'
 | 
						||
            subtitles.setdefault(cc.get('lang'), []).append({
 | 
						||
                'url': cc_url,
 | 
						||
                'ext': ext,
 | 
						||
            })
 | 
						||
 | 
						||
        thumbnails = []
 | 
						||
        for thumbnail in video_data.get('thumbnails', {}).get('thumbnail', []):
 | 
						||
            thumbnail_url = thumbnail.get('value')
 | 
						||
            if not thumbnail_url:
 | 
						||
                continue
 | 
						||
            thumbnails.append({
 | 
						||
                'url': thumbnail_url,
 | 
						||
                'width': int_or_none(thumbnail.get('width')),
 | 
						||
                'height': int_or_none(thumbnail.get('height')),
 | 
						||
            })
 | 
						||
 | 
						||
        return {
 | 
						||
            'id': video_id,
 | 
						||
            'title': title,
 | 
						||
            'description': video_data.get('longdescription') or video_data.get('description'),
 | 
						||
            'duration': int_or_none(video_data.get('duration', {}).get('value'), 1000),
 | 
						||
            'age_limit': parse_age_limit(video_data.get('tvrating', {}).get('rating')),
 | 
						||
            'episode_number': int_or_none(video_data.get('episodenumber')),
 | 
						||
            'series': video_data.get('show', {}).get('title'),
 | 
						||
            'season_number': int_or_none(video_data.get('season', {}).get('num')),
 | 
						||
            'thumbnails': thumbnails,
 | 
						||
            'formats': formats,
 | 
						||
            'subtitles': subtitles,
 | 
						||
            'timestamp': unified_timestamp(traverse_obj(video_data, ('airdates', 'airdate', 0))),
 | 
						||
        }
 |