mirror of
				https://github.com/yt-dlp/yt-dlp.git
				synced 2025-10-31 14:45:14 +00:00 
			
		
		
		
	[funk] fix extraction(closes #17915)
This commit is contained in:
		| @@ -1,89 +1,21 @@ | |||||||
| # coding: utf-8 | # coding: utf-8 | ||||||
| from __future__ import unicode_literals | from __future__ import unicode_literals | ||||||
|  |  | ||||||
| import itertools |  | ||||||
| import re | import re | ||||||
|  |  | ||||||
| from .common import InfoExtractor | from .common import InfoExtractor | ||||||
| from .nexx import NexxIE | from .nexx import NexxIE | ||||||
| from ..compat import compat_str |  | ||||||
| from ..utils import ( | from ..utils import ( | ||||||
|     int_or_none, |     int_or_none, | ||||||
|     try_get, |     str_or_none, | ||||||
| ) | ) | ||||||
|  |  | ||||||
|  |  | ||||||
| class FunkBaseIE(InfoExtractor): | class FunkIE(InfoExtractor): | ||||||
|     _HEADERS = { |     _VALID_URL = r'https?://(?:www\.)?funk\.net/(?:channel|playlist)/[^/]+/(?P<display_id>[0-9a-z-]+)-(?P<id>\d+)' | ||||||
|         'Accept': '*/*', |  | ||||||
|         'Accept-Language': 'en-US,en;q=0.9,ru;q=0.8', |  | ||||||
|         'authorization': 'eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9.eyJjbGllbnROYW1lIjoid2ViYXBwLXYzMSIsInNjb3BlIjoic3RhdGljLWNvbnRlbnQtYXBpLGN1cmF0aW9uLWFwaSxuZXh4LWNvbnRlbnQtYXBpLXYzMSx3ZWJhcHAtYXBpIn0.mbuG9wS9Yf5q6PqgR4fiaRFIagiHk9JhwoKES7ksVX4', |  | ||||||
|     } |  | ||||||
|     _AUTH = 'eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9.eyJjbGllbnROYW1lIjoid2ViYXBwLXYzMSIsInNjb3BlIjoic3RhdGljLWNvbnRlbnQtYXBpLGN1cmF0aW9uLWFwaSxuZXh4LWNvbnRlbnQtYXBpLXYzMSx3ZWJhcHAtYXBpIn0.mbuG9wS9Yf5q6PqgR4fiaRFIagiHk9JhwoKES7ksVX4' |  | ||||||
|  |  | ||||||
|     @staticmethod |  | ||||||
|     def _make_headers(referer): |  | ||||||
|         headers = FunkBaseIE._HEADERS.copy() |  | ||||||
|         headers['Referer'] = referer |  | ||||||
|         return headers |  | ||||||
|  |  | ||||||
|     def _make_url_result(self, video): |  | ||||||
|         return { |  | ||||||
|             '_type': 'url_transparent', |  | ||||||
|             'url': 'nexx:741:%s' % video['sourceId'], |  | ||||||
|             'ie_key': NexxIE.ie_key(), |  | ||||||
|             'id': video['sourceId'], |  | ||||||
|             'title': video.get('title'), |  | ||||||
|             'description': video.get('description'), |  | ||||||
|             'duration': int_or_none(video.get('duration')), |  | ||||||
|             'season_number': int_or_none(video.get('seasonNr')), |  | ||||||
|             'episode_number': int_or_none(video.get('episodeNr')), |  | ||||||
|         } |  | ||||||
|  |  | ||||||
|  |  | ||||||
| class FunkMixIE(FunkBaseIE): |  | ||||||
|     _VALID_URL = r'https?://(?:www\.)?funk\.net/mix/(?P<id>[^/]+)/(?P<alias>[^/?#&]+)' |  | ||||||
|     _TESTS = [{ |     _TESTS = [{ | ||||||
|         'url': 'https://www.funk.net/mix/59d65d935f8b160001828b5b/die-realste-kifferdoku-aller-zeiten', |         'url': 'https://www.funk.net/channel/ba-793/die-lustigsten-instrumente-aus-dem-internet-teil-2-1155821', | ||||||
|         'md5': '8edf617c2f2b7c9847dfda313f199009', |         'md5': '8dd9d9ab59b4aa4173b3197f2ea48e81', | ||||||
|         'info_dict': { |  | ||||||
|             'id': '123748', |  | ||||||
|             'ext': 'mp4', |  | ||||||
|             'title': '"Die realste Kifferdoku aller Zeiten"', |  | ||||||
|             'description': 'md5:c97160f5bafa8d47ec8e2e461012aa9d', |  | ||||||
|             'timestamp': 1490274721, |  | ||||||
|             'upload_date': '20170323', |  | ||||||
|         }, |  | ||||||
|     }] |  | ||||||
|  |  | ||||||
|     def _real_extract(self, url): |  | ||||||
|         mobj = re.match(self._VALID_URL, url) |  | ||||||
|         mix_id = mobj.group('id') |  | ||||||
|         alias = mobj.group('alias') |  | ||||||
|  |  | ||||||
|         lists = self._download_json( |  | ||||||
|             'https://www.funk.net/api/v3.1/curation/curatedLists/', |  | ||||||
|             mix_id, headers=self._make_headers(url), query={ |  | ||||||
|                 'size': 100, |  | ||||||
|             })['_embedded']['curatedListList'] |  | ||||||
|  |  | ||||||
|         metas = next( |  | ||||||
|             l for l in lists |  | ||||||
|             if mix_id in (l.get('entityId'), l.get('alias')))['videoMetas'] |  | ||||||
|         video = next( |  | ||||||
|             meta['videoDataDelegate'] |  | ||||||
|             for meta in metas |  | ||||||
|             if try_get( |  | ||||||
|                 meta, lambda x: x['videoDataDelegate']['alias'], |  | ||||||
|                 compat_str) == alias) |  | ||||||
|  |  | ||||||
|         return self._make_url_result(video) |  | ||||||
|  |  | ||||||
|  |  | ||||||
| class FunkChannelIE(FunkBaseIE): |  | ||||||
|     _VALID_URL = r'https?://(?:www\.)?funk\.net/channel/(?P<id>[^/]+)/(?P<alias>[^/?#&]+)' |  | ||||||
|     _TESTS = [{ |  | ||||||
|         'url': 'https://www.funk.net/channel/ba/die-lustigsten-instrumente-aus-dem-internet-teil-2', |  | ||||||
|         'info_dict': { |         'info_dict': { | ||||||
|             'id': '1155821', |             'id': '1155821', | ||||||
|             'ext': 'mp4', |             'ext': 'mp4', | ||||||
| @@ -92,83 +24,26 @@ class FunkChannelIE(FunkBaseIE): | |||||||
|             'timestamp': 1514507395, |             'timestamp': 1514507395, | ||||||
|             'upload_date': '20171229', |             'upload_date': '20171229', | ||||||
|         }, |         }, | ||||||
|         'params': { |  | ||||||
|             'skip_download': True, |  | ||||||
|         }, |  | ||||||
|     }, { |     }, { | ||||||
|         # only available via byIdList API |         'url': 'https://www.funk.net/playlist/neuesteVideos/kameras-auf-dem-fusion-festival-1618699', | ||||||
|         'url': 'https://www.funk.net/channel/informr/martin-sonneborn-erklaert-die-eu', |  | ||||||
|         'info_dict': { |  | ||||||
|             'id': '205067', |  | ||||||
|             'ext': 'mp4', |  | ||||||
|             'title': 'Martin Sonneborn erklärt die EU', |  | ||||||
|             'description': 'md5:050f74626e4ed87edf4626d2024210c0', |  | ||||||
|             'timestamp': 1494424042, |  | ||||||
|             'upload_date': '20170510', |  | ||||||
|         }, |  | ||||||
|         'params': { |  | ||||||
|             'skip_download': True, |  | ||||||
|         }, |  | ||||||
|     }, { |  | ||||||
|         'url': 'https://www.funk.net/channel/59d5149841dca100012511e3/mein-erster-job-lovemilla-folge-1/lovemilla/', |  | ||||||
|         'only_matching': True, |         'only_matching': True, | ||||||
|     }] |     }] | ||||||
|  |  | ||||||
|     def _real_extract(self, url): |     def _real_extract(self, url): | ||||||
|         mobj = re.match(self._VALID_URL, url) |         display_id, nexx_id = re.match(self._VALID_URL, url).groups() | ||||||
|         channel_id = mobj.group('id') |         video = self._download_json( | ||||||
|         alias = mobj.group('alias') |             'https://www.funk.net/api/v4.0/videos/' + nexx_id, nexx_id) | ||||||
|  |         return { | ||||||
|         headers = self._make_headers(url) |             '_type': 'url_transparent', | ||||||
|  |             'url': 'nexx:741:' + nexx_id, | ||||||
|         video = None |             'ie_key': NexxIE.ie_key(), | ||||||
|  |             'id': nexx_id, | ||||||
|         # Id-based channels are currently broken on their side: webplayer |             'title': video.get('title'), | ||||||
|         # tries to process them via byChannelAlias endpoint and fails |             'description': video.get('description'), | ||||||
|         # predictably. |             'duration': int_or_none(video.get('duration')), | ||||||
|         for page_num in itertools.count(): |             'channel_id': str_or_none(video.get('channelId')), | ||||||
|             by_channel_alias = self._download_json( |             'display_id': display_id, | ||||||
|                 'https://www.funk.net/api/v3.1/webapp/videos/byChannelAlias/%s' |             'tags': video.get('tags'), | ||||||
|                 % channel_id, |             'thumbnail': video.get('imageUrlLandscape'), | ||||||
|                 'Downloading byChannelAlias JSON page %d' % (page_num + 1), |         } | ||||||
|                 headers=headers, query={ |  | ||||||
|                     'filterFsk': 'false', |  | ||||||
|                     'sort': 'creationDate,desc', |  | ||||||
|                     'size': 100, |  | ||||||
|                     'page': page_num, |  | ||||||
|                 }, fatal=False) |  | ||||||
|             if not by_channel_alias: |  | ||||||
|                 break |  | ||||||
|             video_list = try_get( |  | ||||||
|                 by_channel_alias, lambda x: x['_embedded']['videoList'], list) |  | ||||||
|             if not video_list: |  | ||||||
|                 break |  | ||||||
|             try: |  | ||||||
|                 video = next(r for r in video_list if r.get('alias') == alias) |  | ||||||
|                 break |  | ||||||
|             except StopIteration: |  | ||||||
|                 pass |  | ||||||
|             if not try_get( |  | ||||||
|                     by_channel_alias, lambda x: x['_links']['next']): |  | ||||||
|                 break |  | ||||||
|  |  | ||||||
|         if not video: |  | ||||||
|             by_id_list = self._download_json( |  | ||||||
|                 'https://www.funk.net/api/v3.0/content/videos/byIdList', |  | ||||||
|                 channel_id, 'Downloading byIdList JSON', headers=headers, |  | ||||||
|                 query={ |  | ||||||
|                     'ids': alias, |  | ||||||
|                 }, fatal=False) |  | ||||||
|             if by_id_list: |  | ||||||
|                 video = try_get(by_id_list, lambda x: x['result'][0], dict) |  | ||||||
|  |  | ||||||
|         if not video: |  | ||||||
|             results = self._download_json( |  | ||||||
|                 'https://www.funk.net/api/v3.0/content/videos/filter', |  | ||||||
|                 channel_id, 'Downloading filter JSON', headers=headers, query={ |  | ||||||
|                     'channelId': channel_id, |  | ||||||
|                     'size': 100, |  | ||||||
|                 })['result'] |  | ||||||
|             video = next(r for r in results if r.get('alias') == alias) |  | ||||||
|  |  | ||||||
|         return self._make_url_result(video) |  | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user
	 Remita Amine
					Remita Amine