mirror of
				https://github.com/yt-dlp/yt-dlp.git
				synced 2025-11-03 16:15:14 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			292 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			292 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
import json
 | 
						|
 | 
						|
from .common import InfoExtractor
 | 
						|
from ..utils import ExtractorError, int_or_none, traverse_obj, try_get
 | 
						|
 | 
						|
 | 
						|
class AmazonMiniTVBaseIE(InfoExtractor):
    """Common session bootstrap and API helper for the Amazon MiniTV extractors."""

    def _real_initialize(self):
        """Request the MiniTV landing page and remember the guest session id.

        Raises:
            ExtractorError: if no ``session-id`` cookie is available for
                ``https://www.amazon.in`` after the landing page was requested.
        """
        self._download_webpage(
            'https://www.amazon.in/minitv', None,
            note='Fetching guest session cookies')
        try:
            session_cookie = self._get_cookies('https://www.amazon.in')['session-id']
        except KeyError:
            # Without the cookie every GraphQL call would lack its session token,
            # so fail here with a readable message instead of a bare KeyError.
            raise ExtractorError('Unable to obtain the "session-id" guest session cookie') from None
        # Stored on the base class (not on the instance), so the value is
        # reachable as ``self.session_id`` from every subclass instance.
        AmazonMiniTVBaseIE.session_id = session_cookie.value

    def _call_api(self, asin, data=None, note=None):
        """Call the MiniTV web API for ``asin`` and return the decoded JSON.

        With a truthy ``data`` the ``graphql`` endpoint is used and ``data`` is
        sent as the JSON-encoded request body; otherwise the ``prs`` endpoint is
        requested with query parameters only.

        Args:
            asin: Content id. Passed to ``_download_json`` as the video id and,
                for ``prs`` requests, sent as the ``contentId`` query parameter.
            data: Optional GraphQL request dict. Its ``variables`` are extended
                with the content type, the session token and the device fields,
                and its ``operationName`` selects which part of the response is
                returned. The dict passed in is left unmodified.
            note: Progress note forwarded to ``_download_json``.

        Returns:
            The whole response for ``prs`` requests, or
            ``resp['data'][data['operationName']]`` for GraphQL requests.

        Raises:
            ExtractorError: if the response carries a non-empty ``errors`` list.
        """
        device = {'clientId': 'ATVIN', 'deviceLocale': 'en_GB'}

        payload = None
        if data:
            # Build a fresh request instead of updating ``data['variables']`` in
            # place, so the caller's dict is never touched. Key order (and hence
            # the serialized body) matches what an in-place update would produce.
            payload = {
                **data,
                'variables': {
                    **(data.get('variables') or {}),
                    'contentType': 'VOD',
                    'sessionIdToken': self.session_id,
                    **device,
                },
            }

        resp = self._download_json(
            f'https://www.amazon.in/minitv/api/web/{"graphql" if payload else "prs"}',
            asin, note=note, headers={'Content-Type': 'application/json'},
            data=json.dumps(payload).encode() if payload else None,
            query=None if payload else {
                'deviceType': 'A1WMMUXPCUJL4N',
                'contentId': asin,
                **device,
            })

        if resp.get('errors'):
            raise ExtractorError(f'MiniTV said: {resp["errors"][0]["message"]}')
        elif not payload:
            return resp
        return resp['data'][data['operationName']]
 | 
						|
 | 
						|
 | 
						|
class AmazonMiniTVIE(AmazonMiniTVBaseIE):
    """Extractor for a single Amazon MiniTV title (episode or movie)."""

    _VALID_URL = r'(?:https?://(?:www\.)?amazon\.in/minitv/tp/|amazonminitv:(?:amzn1\.dv\.gti\.)?)(?P<id>[a-f0-9-]+)'
    _TESTS = [{
        'url': 'https://www.amazon.in/minitv/tp/75fe3a75-b8fe-4499-8100-5c9424344840?referrer=https%3A%2F%2Fwww.amazon.in%2Fminitv',
        'info_dict': {
            'id': 'amzn1.dv.gti.75fe3a75-b8fe-4499-8100-5c9424344840',
            'ext': 'mp4',
            'title': 'May I Kiss You?',
            'language': 'Hindi',
            'thumbnail': r're:^https?://.*\.jpg$',
            'description': 'md5:a549bfc747973e04feb707833474e59d',
            'release_timestamp': 1644710400,
            'release_date': '20220213',
            'duration': 846,
            'chapters': 'count:2',
            'series': 'Couple Goals',
            'series_id': 'amzn1.dv.gti.56521d46-b040-4fd5-872e-3e70476a04b0',
            'season': 'Season 3',
            'season_number': 3,
            'season_id': 'amzn1.dv.gti.20331016-d9b9-4968-b991-c89fa4927a36',
            'episode': 'May I Kiss You?',
            'episode_number': 2,
            'episode_id': 'amzn1.dv.gti.75fe3a75-b8fe-4499-8100-5c9424344840',
        },
    }, {
        'url': 'https://www.amazon.in/minitv/tp/280d2564-584f-452f-9c98-7baf906e01ab?referrer=https%3A%2F%2Fwww.amazon.in%2Fminitv',
        'info_dict': {
            'id': 'amzn1.dv.gti.280d2564-584f-452f-9c98-7baf906e01ab',
            'ext': 'mp4',
            'title': 'Jahaan',
            'language': 'Hindi',
            'thumbnail': r're:^https?://.*\.jpg',
            'description': 'md5:05eb765a77bf703f322f120ec6867339',
            'release_timestamp': 1647475200,
            'release_date': '20220317',
            'duration': 783,
            'chapters': [],
        },
    }, {
        'url': 'https://www.amazon.in/minitv/tp/280d2564-584f-452f-9c98-7baf906e01ab',
        'only_matching': True,
    }, {
        'url': 'amazonminitv:amzn1.dv.gti.280d2564-584f-452f-9c98-7baf906e01ab',
        'only_matching': True,
    }, {
        'url': 'amazonminitv:280d2564-584f-452f-9c98-7baf906e01ab',
        'only_matching': True,
    }]

    _GRAPHQL_QUERY_CONTENT = '''
query content($sessionIdToken: String!, $deviceLocale: String, $contentId: ID!, $contentType: ContentType!, $clientId: String) {
  content(
    applicationContextInput: {deviceLocale: $deviceLocale, sessionIdToken: $sessionIdToken, clientId: $clientId}
    contentId: $contentId
    contentType: $contentType
  ) {
    contentId
    name
    ... on Episode {
      contentId
      vodType
      name
      images
      description {
        synopsis
        contentLengthInSeconds
      }
      publicReleaseDateUTC
      audioTracks
      seasonId
      seriesId
      seriesName
      seasonNumber
      episodeNumber
      timecode {
        endCreditsTime
      }
    }
    ... on MovieContent {
      contentId
      vodType
      name
      description {
        synopsis
        contentLengthInSeconds
      }
      images
      publicReleaseDateUTC
      audioTracks
    }
  }
}'''

    def _real_extract(self, url):
        """Build the info dict for the title referenced by ``url``.

        Two API calls are made, in this order: the playback request, whose
        ``playbackAssets`` are turned into formats and subtitles, and the
        ``content`` GraphQL query, which supplies the metadata fields.
        """
        asin = f'amzn1.dv.gti.{self._match_id(url)}'
        playback = self._call_api(asin, note='Downloading playback info')

        formats, subtitles = [], {}
        for asset_type, asset in playback['playbackAssets'].items():
            # Assets without a manifest URL are skipped silently.
            if not traverse_obj(asset, 'manifestUrl'):
                continue
            if asset_type == 'hls':
                found_formats, found_subs = self._extract_m3u8_formats_and_subtitles(
                    asset['manifestUrl'], asin, ext='mp4', entry_protocol='m3u8_native',
                    m3u8_id=asset_type, fatal=False)
            elif asset_type == 'dash':
                found_formats, found_subs = self._extract_mpd_formats_and_subtitles(
                    asset['manifestUrl'], asin, mpd_id=asset_type, fatal=False)
            else:
                self.report_warning(f'Unknown asset type: {asset_type}')
                continue
            formats.extend(found_formats)
            subtitles = self._merge_subtitles(subtitles, found_subs)

        content_request = {
            'operationName': 'content',
            'variables': {'contentId': asin},
            'query': self._GRAPHQL_QUERY_CONTENT,
        }
        title_info = self._call_api(asin, note='Downloading title info', data=content_request)

        # The end-credits time is divided by 1000 before being used as the
        # chapter start time.
        credits_time = try_get(title_info, lambda x: x['timecode']['endCreditsTime'] / 1000)
        is_episode = title_info.get('vodType') == 'EPISODE'

        name = title_info.get('name')
        if credits_time:
            chapters = [{'start_time': credits_time, 'title': 'End Credits'}]
        else:
            chapters = []
        thumbnails = [
            {'id': image_id, 'url': image_url}
            for image_id, image_url in (title_info.get('images') or {}).items()
        ]
        release_timestamp = int_or_none(
            try_get(title_info, lambda x: x['publicReleaseDateUTC'] / 1000))

        return {
            'id': asin,
            'title': name,
            'formats': formats,
            'subtitles': subtitles,
            'language': traverse_obj(title_info, ('audioTracks', 0)),
            'thumbnails': thumbnails,
            'description': traverse_obj(title_info, ('description', 'synopsis')),
            'release_timestamp': release_timestamp,
            'duration': traverse_obj(title_info, ('description', 'contentLengthInSeconds')),
            'chapters': chapters,
            'series': title_info.get('seriesName'),
            'series_id': title_info.get('seriesId'),
            'season_number': title_info.get('seasonNumber'),
            'season_id': title_info.get('seasonId'),
            # Episode-only fields are populated only when vodType is 'EPISODE'.
            'episode': name if is_episode else None,
            'episode_number': title_info.get('episodeNumber'),
            'episode_id': asin if is_episode else None,
        }
 | 
						|
 | 
						|
 | 
						|
class AmazonMiniTVSeasonIE(AmazonMiniTVBaseIE):
    """Playlist extractor that expands a MiniTV season into its episodes."""

    IE_NAME = 'amazonminitv:season'
    _VALID_URL = r'amazonminitv:season:(?:amzn1\.dv\.gti\.)?(?P<id>[a-f0-9-]+)'
    # The advertised prefix has to be the one _VALID_URL actually matches.
    IE_DESC = 'Amazon MiniTV Season, "amazonminitv:season:" prefix'
    _TESTS = [{
        'url': 'amazonminitv:season:amzn1.dv.gti.0aa996eb-6a1b-4886-a342-387fbd2f1db0',
        'playlist_mincount': 6,
        'info_dict': {
            'id': 'amzn1.dv.gti.0aa996eb-6a1b-4886-a342-387fbd2f1db0',
        },
    }, {
        'url': 'amazonminitv:season:0aa996eb-6a1b-4886-a342-387fbd2f1db0',
        'only_matching': True,
    }]

    _GRAPHQL_QUERY = '''
query getEpisodes($sessionIdToken: String!, $clientId: String, $episodeOrSeasonId: ID!, $deviceLocale: String) {
  getEpisodes(
    applicationContextInput: {sessionIdToken: $sessionIdToken, deviceLocale: $deviceLocale, clientId: $clientId}
    episodeOrSeasonId: $episodeOrSeasonId
  ) {
    episodes {
      ... on Episode {
        contentId
        name
        images
        seriesName
        seasonId
        seriesId
        seasonNumber
        episodeNumber
        description {
          synopsis
          contentLengthInSeconds
        }
        publicReleaseDateUTC
      }
    }
  }
}
'''

    def _entries(self, asin):
        """Yield one ``amazonminitv:<contentId>`` URL result per episode of ``asin``.

        The episodes come from the ``getEpisodes`` GraphQL operation; each
        result is delegated to ``AmazonMiniTVIE``.
        """
        season_info = self._call_api(
            asin, note='Downloading season info', data={
                'operationName': 'getEpisodes',
                'variables': {'episodeOrSeasonId': asin},
                'query': self._GRAPHQL_QUERY,
            })

        for episode in season_info['episodes']:
            yield self.url_result(
                f'amazonminitv:{episode["contentId"]}', AmazonMiniTVIE, episode['contentId'])

    def _real_extract(self, url):
        """Return a playlist of the season's episodes, identified by the full ASIN."""
        asin = f'amzn1.dv.gti.{self._match_id(url)}'
        return self.playlist_result(self._entries(asin), asin)
 | 
						|
 | 
						|
 | 
						|
class AmazonMiniTVSeriesIE(AmazonMiniTVBaseIE):
    """Playlist extractor that expands a MiniTV series into its seasons."""

    IE_NAME = 'amazonminitv:series'
    _VALID_URL = r'amazonminitv:series:(?:amzn1\.dv\.gti\.)?(?P<id>[a-f0-9-]+)'
    # The advertised prefix has to be the one _VALID_URL actually matches.
    IE_DESC = 'Amazon MiniTV Series, "amazonminitv:series:" prefix'
    _TESTS = [{
        'url': 'amazonminitv:series:amzn1.dv.gti.56521d46-b040-4fd5-872e-3e70476a04b0',
        'playlist_mincount': 3,
        'info_dict': {
            'id': 'amzn1.dv.gti.56521d46-b040-4fd5-872e-3e70476a04b0',
        },
    }, {
        'url': 'amazonminitv:series:56521d46-b040-4fd5-872e-3e70476a04b0',
        'only_matching': True,
    }]

    _GRAPHQL_QUERY = '''
query getSeasons($sessionIdToken: String!, $deviceLocale: String, $episodeOrSeasonOrSeriesId: ID!, $clientId: String) {
  getSeasons(
    applicationContextInput: {deviceLocale: $deviceLocale, sessionIdToken: $sessionIdToken, clientId: $clientId}
    episodeOrSeasonOrSeriesId: $episodeOrSeasonOrSeriesId
  ) {
    seasons {
      seasonId
    }
  }
}
'''

    def _entries(self, asin):
        """Yield one ``amazonminitv:season:<seasonId>`` URL result per season of ``asin``.

        The seasons come from the ``getSeasons`` GraphQL operation; each result
        is delegated to ``AmazonMiniTVSeasonIE``.
        """
        series_info = self._call_api(
            asin, note='Downloading series info', data={
                'operationName': 'getSeasons',
                'variables': {'episodeOrSeasonOrSeriesId': asin},
                'query': self._GRAPHQL_QUERY,
            })

        for season in series_info['seasons']:
            yield self.url_result(f'amazonminitv:season:{season["seasonId"]}', AmazonMiniTVSeasonIE, season['seasonId'])

    def _real_extract(self, url):
        """Return a playlist of the series' seasons, identified by the full ASIN."""
        asin = f'amzn1.dv.gti.{self._match_id(url)}'
        return self.playlist_result(self._entries(asin), asin)
 |