123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291 |
- import json
- from .common import InfoExtractor
- from ..utils import ExtractorError, int_or_none, traverse_obj, try_get
class AmazonMiniTVBaseIE(InfoExtractor):
    """Common guest-session setup and API access for the Amazon MiniTV extractors."""

    def _real_initialize(self):
        """Load the MiniTV landing page and remember its ``session-id`` cookie.

        The cookie value is stored as ``AmazonMiniTVBaseIE.session_id`` (a
        class attribute), which ``_call_api`` sends as ``sessionIdToken``.

        Raises:
            ExtractorError: if no ``session-id`` cookie is available for
                https://www.amazon.in after the page has been fetched.
        """
        self._download_webpage(
            'https://www.amazon.in/minitv', None,
            note='Fetching guest session cookies')
        session_cookie = self._get_cookies('https://www.amazon.in').get('session-id')
        if session_cookie is None:
            # Report the actual problem instead of failing with a bare KeyError
            raise ExtractorError('Unable to obtain the "session-id" guest cookie from amazon.in')
        AmazonMiniTVBaseIE.session_id = session_cookie.value

    def _call_api(self, asin, data=None, note=None):
        """Query the MiniTV web API and return the decoded JSON result.

        Args:
            asin: Content identifier. Used as the video id of the request and,
                for the "prs" endpoint, as the ``contentId`` query value.
            data: Optional GraphQL request body with ``operationName``,
                ``variables`` and ``query`` keys. When given, it is sent as
                JSON to the "graphql" endpoint; otherwise the "prs" endpoint
                is queried. The passed dict is not modified.
            note: Progress message shown while downloading.

        Returns:
            The whole response for "prs" requests, or
            ``response['data'][operationName]`` for GraphQL requests.

        Raises:
            ExtractorError: if the response carries a non-empty ``errors`` entry.
        """
        device = {'clientId': 'ATVIN', 'deviceLocale': 'en_GB'}

        payload = None
        if data:
            # Build a fresh body so the caller's dict (and its nested
            # "variables" dict) are left untouched
            payload = {
                **data,
                'variables': {
                    **(data.get('variables') or {}),
                    'contentType': 'VOD',
                    'sessionIdToken': self.session_id,
                    **device,
                },
            }

        endpoint = 'graphql' if payload else 'prs'
        resp = self._download_json(
            f'https://www.amazon.in/minitv/api/web/{endpoint}',
            asin, note=note, headers={'Content-Type': 'application/json'},
            data=json.dumps(payload).encode() if payload else None,
            query=None if payload else {
                'deviceType': 'A1WMMUXPCUJL4N',
                'contentId': asin,
                **device,
            })

        errors = resp.get('errors')
        if errors:
            # Fall back to the raw error structure if it has no "message" field
            message = traverse_obj(errors, (0, 'message')) or errors
            raise ExtractorError(f'MiniTV said: {message}')
        elif not data:
            return resp
        return resp['data'][data['operationName']]
class AmazonMiniTVIE(AmazonMiniTVBaseIE):
    """Extractor for a single Amazon MiniTV title (episode or movie).

    Accepts ``https://www.amazon.in/minitv/tp/<id>`` pages as well as the
    ``amazonminitv:<id>`` pseudo-URL, with or without the ``amzn1.dv.gti.``
    prefix on the id.
    """

    _VALID_URL = r'(?:https?://(?:www\.)?amazon\.in/minitv/tp/|amazonminitv:(?:amzn1\.dv\.gti\.)?)(?P<id>[a-f0-9-]+)'
    _TESTS = [{
        'url': 'https://www.amazon.in/minitv/tp/75fe3a75-b8fe-4499-8100-5c9424344840?referrer=https%3A%2F%2Fwww.amazon.in%2Fminitv',
        'info_dict': {
            'id': 'amzn1.dv.gti.75fe3a75-b8fe-4499-8100-5c9424344840',
            'ext': 'mp4',
            'title': 'May I Kiss You?',
            'language': 'Hindi',
            'thumbnail': r're:^https?://.*\.jpg$',
            'description': 'md5:a549bfc747973e04feb707833474e59d',
            'release_timestamp': 1644710400,
            'release_date': '20220213',
            'duration': 846,
            'chapters': 'count:2',
            'series': 'Couple Goals',
            'series_id': 'amzn1.dv.gti.56521d46-b040-4fd5-872e-3e70476a04b0',
            'season': 'Season 3',
            'season_number': 3,
            'season_id': 'amzn1.dv.gti.20331016-d9b9-4968-b991-c89fa4927a36',
            'episode': 'May I Kiss You?',
            'episode_number': 2,
            'episode_id': 'amzn1.dv.gti.75fe3a75-b8fe-4499-8100-5c9424344840',
        },
    }, {
        'url': 'https://www.amazon.in/minitv/tp/280d2564-584f-452f-9c98-7baf906e01ab?referrer=https%3A%2F%2Fwww.amazon.in%2Fminitv',
        'info_dict': {
            'id': 'amzn1.dv.gti.280d2564-584f-452f-9c98-7baf906e01ab',
            'ext': 'mp4',
            'title': 'Jahaan',
            'language': 'Hindi',
            'thumbnail': r're:^https?://.*\.jpg',
            'description': 'md5:05eb765a77bf703f322f120ec6867339',
            'release_timestamp': 1647475200,
            'release_date': '20220317',
            'duration': 783,
            'chapters': [],
        },
    }, {
        'url': 'https://www.amazon.in/minitv/tp/280d2564-584f-452f-9c98-7baf906e01ab',
        'only_matching': True,
    }, {
        'url': 'amazonminitv:amzn1.dv.gti.280d2564-584f-452f-9c98-7baf906e01ab',
        'only_matching': True,
    }, {
        'url': 'amazonminitv:280d2564-584f-452f-9c98-7baf906e01ab',
        'only_matching': True,
    }]

    # GraphQL document for the "content" operation; whitespace inside the
    # query is not significant to GraphQL
    _GRAPHQL_QUERY_CONTENT = '''
query content($sessionIdToken: String!, $deviceLocale: String, $contentId: ID!, $contentType: ContentType!, $clientId: String) {
  content(
    applicationContextInput: {deviceLocale: $deviceLocale, sessionIdToken: $sessionIdToken, clientId: $clientId}
    contentId: $contentId
    contentType: $contentType
  ) {
    contentId
    name
    ... on Episode {
      contentId
      vodType
      name
      images
      description {
        synopsis
        contentLengthInSeconds
      }
      publicReleaseDateUTC
      audioTracks
      seasonId
      seriesId
      seriesName
      seasonNumber
      episodeNumber
      timecode {
        endCreditsTime
      }
    }
    ... on MovieContent {
      contentId
      vodType
      name
      description {
        synopsis
        contentLengthInSeconds
      }
      images
      publicReleaseDateUTC
      audioTracks
    }
  }
}'''

    def _real_extract(self, url):
        """Collect formats, subtitles and metadata for one MiniTV title.

        Playback manifests come from the "prs" endpoint and the descriptive
        metadata from the GraphQL ``content`` operation. Episode-only fields
        are filled in when the title reports ``vodType == 'EPISODE'``.
        """
        asin = f'amzn1.dv.gti.{self._match_id(url)}'
        prs = self._call_api(asin, note='Downloading playback info')

        formats, subtitles = [], {}
        # A missing or null "playbackAssets" simply yields no formats rather
        # than aborting with a KeyError/AttributeError
        for type_, asset in (prs.get('playbackAssets') or {}).items():
            manifest_url = traverse_obj(asset, 'manifestUrl')
            if not manifest_url:
                continue
            if type_ == 'hls':
                m3u8_fmts, m3u8_subs = self._extract_m3u8_formats_and_subtitles(
                    manifest_url, asin, ext='mp4', entry_protocol='m3u8_native',
                    m3u8_id=type_, fatal=False)
                formats.extend(m3u8_fmts)
                subtitles = self._merge_subtitles(subtitles, m3u8_subs)
            elif type_ == 'dash':
                mpd_fmts, mpd_subs = self._extract_mpd_formats_and_subtitles(
                    manifest_url, asin, mpd_id=type_, fatal=False)
                formats.extend(mpd_fmts)
                subtitles = self._merge_subtitles(subtitles, mpd_subs)
            else:
                self.report_warning(f'Unknown asset type: {type_}')

        # The API may answer with a null "content" object; treat it as empty
        # metadata so the lookups below do not fail on None
        title_info = self._call_api(
            asin, note='Downloading title info', data={
                'operationName': 'content',
                'variables': {'contentId': asin},
                'query': self._GRAPHQL_QUERY_CONTENT,
            }) or {}
        # endCreditsTime is divided by 1000 (presumably milliseconds -> seconds)
        credits_time = try_get(title_info, lambda x: x['timecode']['endCreditsTime'] / 1000)
        is_episode = title_info.get('vodType') == 'EPISODE'

        return {
            'id': asin,
            'title': title_info.get('name'),
            'formats': formats,
            'subtitles': subtitles,
            'language': traverse_obj(title_info, ('audioTracks', 0)),
            # Distinct loop names so the `url` argument is not shadowed
            'thumbnails': [{
                'id': image_id,
                'url': image_url,
            } for image_id, image_url in (title_info.get('images') or {}).items()],
            'description': traverse_obj(title_info, ('description', 'synopsis')),
            # publicReleaseDateUTC is scaled down by 1000 to get the timestamp
            'release_timestamp': int_or_none(title_info.get('publicReleaseDateUTC'), scale=1000),
            'duration': traverse_obj(title_info, ('description', 'contentLengthInSeconds')),
            'chapters': [{
                'start_time': credits_time,
                'title': 'End Credits',
            }] if credits_time else [],
            'series': title_info.get('seriesName'),
            'series_id': title_info.get('seriesId'),
            'season_number': title_info.get('seasonNumber'),
            'season_id': title_info.get('seasonId'),
            'episode': title_info.get('name') if is_episode else None,
            'episode_number': title_info.get('episodeNumber'),
            'episode_id': asin if is_episode else None,
        }
class AmazonMiniTVSeasonIE(AmazonMiniTVBaseIE):
    """Playlist extractor for the episodes of one Amazon MiniTV season.

    Only reachable through the ``amazonminitv:season:<id>`` pseudo-URL; the
    ``amzn1.dv.gti.`` prefix on the id is optional.
    """

    IE_NAME = 'amazonminitv:season'
    _VALID_URL = r'amazonminitv:season:(?:amzn1\.dv\.gti\.)?(?P<id>[a-f0-9-]+)'
    # Describes a season and names the prefix that _VALID_URL actually accepts
    IE_DESC = 'Amazon MiniTV Season, "amazonminitv:season:" prefix'
    _TESTS = [{
        'url': 'amazonminitv:season:amzn1.dv.gti.0aa996eb-6a1b-4886-a342-387fbd2f1db0',
        'playlist_mincount': 6,
        'info_dict': {
            'id': 'amzn1.dv.gti.0aa996eb-6a1b-4886-a342-387fbd2f1db0',
        },
    }, {
        'url': 'amazonminitv:season:0aa996eb-6a1b-4886-a342-387fbd2f1db0',
        'only_matching': True,
    }]

    # GraphQL document for the "getEpisodes" operation; whitespace inside the
    # query is not significant to GraphQL
    _GRAPHQL_QUERY = '''
query getEpisodes($sessionIdToken: String!, $clientId: String, $episodeOrSeasonId: ID!, $deviceLocale: String) {
  getEpisodes(
    applicationContextInput: {sessionIdToken: $sessionIdToken, deviceLocale: $deviceLocale, clientId: $clientId}
    episodeOrSeasonId: $episodeOrSeasonId
  ) {
    episodes {
      ... on Episode {
        contentId
        name
        images
        seriesName
        seasonId
        seriesId
        seasonNumber
        episodeNumber
        description {
          synopsis
          contentLengthInSeconds
        }
        publicReleaseDateUTC
      }
    }
  }
}
'''

    def _entries(self, asin):
        """Yield one ``amazonminitv:<contentId>`` url result per episode of the season.

        Episodes without a ``contentId`` are skipped, and a response without
        an ``episodes`` list yields nothing.
        """
        season_info = self._call_api(
            asin, note='Downloading season info', data={
                'operationName': 'getEpisodes',
                'variables': {'episodeOrSeasonId': asin},
                'query': self._GRAPHQL_QUERY,
            })

        # `or []` keeps the loop safe if the traversal finds nothing
        for episode_id in traverse_obj(season_info, ('episodes', ..., 'contentId')) or []:
            yield self.url_result(
                f'amazonminitv:{episode_id}', AmazonMiniTVIE, episode_id)

    def _real_extract(self, url):
        """Return a playlist of the season's episodes, with the season id as playlist id."""
        asin = f'amzn1.dv.gti.{self._match_id(url)}'
        return self.playlist_result(self._entries(asin), asin)
class AmazonMiniTVSeriesIE(AmazonMiniTVBaseIE):
    """Playlist extractor for the seasons of one Amazon MiniTV series.

    Only reachable through the ``amazonminitv:series:<id>`` pseudo-URL; the
    ``amzn1.dv.gti.`` prefix on the id is optional. Each entry is an
    ``amazonminitv:season:<seasonId>`` url result.
    """

    IE_NAME = 'amazonminitv:series'
    _VALID_URL = r'amazonminitv:series:(?:amzn1\.dv\.gti\.)?(?P<id>[a-f0-9-]+)'
    # Documents the pseudo-URL prefix accepted by _VALID_URL
    IE_DESC = 'Amazon MiniTV Series, "amazonminitv:series:" prefix'
    _TESTS = [{
        'url': 'amazonminitv:series:amzn1.dv.gti.56521d46-b040-4fd5-872e-3e70476a04b0',
        'playlist_mincount': 3,
        'info_dict': {
            'id': 'amzn1.dv.gti.56521d46-b040-4fd5-872e-3e70476a04b0',
        },
    }, {
        'url': 'amazonminitv:series:56521d46-b040-4fd5-872e-3e70476a04b0',
        'only_matching': True,
    }]

    # GraphQL document for the "getSeasons" operation; whitespace inside the
    # query is not significant to GraphQL
    _GRAPHQL_QUERY = '''
query getSeasons($sessionIdToken: String!, $deviceLocale: String, $episodeOrSeasonOrSeriesId: ID!, $clientId: String) {
  getSeasons(
    applicationContextInput: {deviceLocale: $deviceLocale, sessionIdToken: $sessionIdToken, clientId: $clientId}
    episodeOrSeasonOrSeriesId: $episodeOrSeasonOrSeriesId
  ) {
    seasons {
      seasonId
    }
  }
}
'''

    def _entries(self, asin):
        """Yield one ``amazonminitv:season:<seasonId>`` url result per season of the series.

        Seasons without a ``seasonId`` are skipped, and a response without a
        ``seasons`` list yields nothing.
        """
        series_info = self._call_api(
            asin, note='Downloading series info', data={
                'operationName': 'getSeasons',
                'variables': {'episodeOrSeasonOrSeriesId': asin},
                'query': self._GRAPHQL_QUERY,
            })

        # `or []` keeps the loop safe if the traversal finds nothing
        for season_id in traverse_obj(series_info, ('seasons', ..., 'seasonId')) or []:
            yield self.url_result(
                f'amazonminitv:season:{season_id}', AmazonMiniTVSeasonIE, season_id)

    def _real_extract(self, url):
        """Return a playlist of the series' seasons, with the series id as playlist id."""
        asin = f'amzn1.dv.gti.{self._match_id(url)}'
        return self.playlist_result(self._entries(asin), asin)
|