mirror of
				https://github.com/yt-dlp/yt-dlp.git
				synced 2025-10-30 22:25:19 +00:00 
			
		
		
		
	[funk] fix extraction(closes #17915)
This commit is contained in:
		| @@ -1,89 +1,21 @@ | ||||
| # coding: utf-8 | ||||
| from __future__ import unicode_literals | ||||
|  | ||||
| import itertools | ||||
| import re | ||||
|  | ||||
| from .common import InfoExtractor | ||||
| from .nexx import NexxIE | ||||
| from ..compat import compat_str | ||||
| from ..utils import ( | ||||
|     int_or_none, | ||||
|     try_get, | ||||
|     str_or_none, | ||||
| ) | ||||
|  | ||||
|  | ||||
| class FunkBaseIE(InfoExtractor): | ||||
|     _HEADERS = { | ||||
|         'Accept': '*/*', | ||||
|         'Accept-Language': 'en-US,en;q=0.9,ru;q=0.8', | ||||
|         'authorization': 'eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9.eyJjbGllbnROYW1lIjoid2ViYXBwLXYzMSIsInNjb3BlIjoic3RhdGljLWNvbnRlbnQtYXBpLGN1cmF0aW9uLWFwaSxuZXh4LWNvbnRlbnQtYXBpLXYzMSx3ZWJhcHAtYXBpIn0.mbuG9wS9Yf5q6PqgR4fiaRFIagiHk9JhwoKES7ksVX4', | ||||
|     } | ||||
|     _AUTH = 'eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9.eyJjbGllbnROYW1lIjoid2ViYXBwLXYzMSIsInNjb3BlIjoic3RhdGljLWNvbnRlbnQtYXBpLGN1cmF0aW9uLWFwaSxuZXh4LWNvbnRlbnQtYXBpLXYzMSx3ZWJhcHAtYXBpIn0.mbuG9wS9Yf5q6PqgR4fiaRFIagiHk9JhwoKES7ksVX4' | ||||
|  | ||||
|     @staticmethod | ||||
|     def _make_headers(referer): | ||||
|         headers = FunkBaseIE._HEADERS.copy() | ||||
|         headers['Referer'] = referer | ||||
|         return headers | ||||
|  | ||||
|     def _make_url_result(self, video): | ||||
|         return { | ||||
|             '_type': 'url_transparent', | ||||
|             'url': 'nexx:741:%s' % video['sourceId'], | ||||
|             'ie_key': NexxIE.ie_key(), | ||||
|             'id': video['sourceId'], | ||||
|             'title': video.get('title'), | ||||
|             'description': video.get('description'), | ||||
|             'duration': int_or_none(video.get('duration')), | ||||
|             'season_number': int_or_none(video.get('seasonNr')), | ||||
|             'episode_number': int_or_none(video.get('episodeNr')), | ||||
|         } | ||||
|  | ||||
|  | ||||
| class FunkMixIE(FunkBaseIE): | ||||
|     _VALID_URL = r'https?://(?:www\.)?funk\.net/mix/(?P<id>[^/]+)/(?P<alias>[^/?#&]+)' | ||||
| class FunkIE(InfoExtractor): | ||||
|     _VALID_URL = r'https?://(?:www\.)?funk\.net/(?:channel|playlist)/[^/]+/(?P<display_id>[0-9a-z-]+)-(?P<id>\d+)' | ||||
|     _TESTS = [{ | ||||
|         'url': 'https://www.funk.net/mix/59d65d935f8b160001828b5b/die-realste-kifferdoku-aller-zeiten', | ||||
|         'md5': '8edf617c2f2b7c9847dfda313f199009', | ||||
|         'info_dict': { | ||||
|             'id': '123748', | ||||
|             'ext': 'mp4', | ||||
|             'title': '"Die realste Kifferdoku aller Zeiten"', | ||||
|             'description': 'md5:c97160f5bafa8d47ec8e2e461012aa9d', | ||||
|             'timestamp': 1490274721, | ||||
|             'upload_date': '20170323', | ||||
|         }, | ||||
|     }] | ||||
|  | ||||
|     def _real_extract(self, url): | ||||
|         mobj = re.match(self._VALID_URL, url) | ||||
|         mix_id = mobj.group('id') | ||||
|         alias = mobj.group('alias') | ||||
|  | ||||
|         lists = self._download_json( | ||||
|             'https://www.funk.net/api/v3.1/curation/curatedLists/', | ||||
|             mix_id, headers=self._make_headers(url), query={ | ||||
|                 'size': 100, | ||||
|             })['_embedded']['curatedListList'] | ||||
|  | ||||
|         metas = next( | ||||
|             l for l in lists | ||||
|             if mix_id in (l.get('entityId'), l.get('alias')))['videoMetas'] | ||||
|         video = next( | ||||
|             meta['videoDataDelegate'] | ||||
|             for meta in metas | ||||
|             if try_get( | ||||
|                 meta, lambda x: x['videoDataDelegate']['alias'], | ||||
|                 compat_str) == alias) | ||||
|  | ||||
|         return self._make_url_result(video) | ||||
|  | ||||
|  | ||||
| class FunkChannelIE(FunkBaseIE): | ||||
|     _VALID_URL = r'https?://(?:www\.)?funk\.net/channel/(?P<id>[^/]+)/(?P<alias>[^/?#&]+)' | ||||
|     _TESTS = [{ | ||||
|         'url': 'https://www.funk.net/channel/ba/die-lustigsten-instrumente-aus-dem-internet-teil-2', | ||||
|         'url': 'https://www.funk.net/channel/ba-793/die-lustigsten-instrumente-aus-dem-internet-teil-2-1155821', | ||||
|         'md5': '8dd9d9ab59b4aa4173b3197f2ea48e81', | ||||
|         'info_dict': { | ||||
|             'id': '1155821', | ||||
|             'ext': 'mp4', | ||||
| @@ -92,83 +24,26 @@ class FunkChannelIE(FunkBaseIE): | ||||
|             'timestamp': 1514507395, | ||||
|             'upload_date': '20171229', | ||||
|         }, | ||||
|         'params': { | ||||
|             'skip_download': True, | ||||
|         }, | ||||
|  | ||||
|     }, { | ||||
|         # only available via byIdList API | ||||
|         'url': 'https://www.funk.net/channel/informr/martin-sonneborn-erklaert-die-eu', | ||||
|         'info_dict': { | ||||
|             'id': '205067', | ||||
|             'ext': 'mp4', | ||||
|             'title': 'Martin Sonneborn erklärt die EU', | ||||
|             'description': 'md5:050f74626e4ed87edf4626d2024210c0', | ||||
|             'timestamp': 1494424042, | ||||
|             'upload_date': '20170510', | ||||
|         }, | ||||
|         'params': { | ||||
|             'skip_download': True, | ||||
|         }, | ||||
|     }, { | ||||
|         'url': 'https://www.funk.net/channel/59d5149841dca100012511e3/mein-erster-job-lovemilla-folge-1/lovemilla/', | ||||
|         'url': 'https://www.funk.net/playlist/neuesteVideos/kameras-auf-dem-fusion-festival-1618699', | ||||
|         'only_matching': True, | ||||
|     }] | ||||
|  | ||||
|     def _real_extract(self, url): | ||||
|         mobj = re.match(self._VALID_URL, url) | ||||
|         channel_id = mobj.group('id') | ||||
|         alias = mobj.group('alias') | ||||
|  | ||||
|         headers = self._make_headers(url) | ||||
|  | ||||
|         video = None | ||||
|  | ||||
|         # Id-based channels are currently broken on their side: webplayer | ||||
|         # tries to process them via byChannelAlias endpoint and fails | ||||
|         # predictably. | ||||
|         for page_num in itertools.count(): | ||||
|             by_channel_alias = self._download_json( | ||||
|                 'https://www.funk.net/api/v3.1/webapp/videos/byChannelAlias/%s' | ||||
|                 % channel_id, | ||||
|                 'Downloading byChannelAlias JSON page %d' % (page_num + 1), | ||||
|                 headers=headers, query={ | ||||
|                     'filterFsk': 'false', | ||||
|                     'sort': 'creationDate,desc', | ||||
|                     'size': 100, | ||||
|                     'page': page_num, | ||||
|                 }, fatal=False) | ||||
|             if not by_channel_alias: | ||||
|                 break | ||||
|             video_list = try_get( | ||||
|                 by_channel_alias, lambda x: x['_embedded']['videoList'], list) | ||||
|             if not video_list: | ||||
|                 break | ||||
|             try: | ||||
|                 video = next(r for r in video_list if r.get('alias') == alias) | ||||
|                 break | ||||
|             except StopIteration: | ||||
|                 pass | ||||
|             if not try_get( | ||||
|                     by_channel_alias, lambda x: x['_links']['next']): | ||||
|                 break | ||||
|  | ||||
|         if not video: | ||||
|             by_id_list = self._download_json( | ||||
|                 'https://www.funk.net/api/v3.0/content/videos/byIdList', | ||||
|                 channel_id, 'Downloading byIdList JSON', headers=headers, | ||||
|                 query={ | ||||
|                     'ids': alias, | ||||
|                 }, fatal=False) | ||||
|             if by_id_list: | ||||
|                 video = try_get(by_id_list, lambda x: x['result'][0], dict) | ||||
|  | ||||
|         if not video: | ||||
|             results = self._download_json( | ||||
|                 'https://www.funk.net/api/v3.0/content/videos/filter', | ||||
|                 channel_id, 'Downloading filter JSON', headers=headers, query={ | ||||
|                     'channelId': channel_id, | ||||
|                     'size': 100, | ||||
|                 })['result'] | ||||
|             video = next(r for r in results if r.get('alias') == alias) | ||||
|  | ||||
|         return self._make_url_result(video) | ||||
|         display_id, nexx_id = re.match(self._VALID_URL, url).groups() | ||||
|         video = self._download_json( | ||||
|             'https://www.funk.net/api/v4.0/videos/' + nexx_id, nexx_id) | ||||
|         return { | ||||
|             '_type': 'url_transparent', | ||||
|             'url': 'nexx:741:' + nexx_id, | ||||
|             'ie_key': NexxIE.ie_key(), | ||||
|             'id': nexx_id, | ||||
|             'title': video.get('title'), | ||||
|             'description': video.get('description'), | ||||
|             'duration': int_or_none(video.get('duration')), | ||||
|             'channel_id': str_or_none(video.get('channelId')), | ||||
|             'display_id': display_id, | ||||
|             'tags': video.get('tags'), | ||||
|             'thumbnail': video.get('imageUrlLandscape'), | ||||
|         } | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 Remita Amine
					Remita Amine