mirror of
				https://github.com/yt-dlp/yt-dlp.git
				synced 2025-10-31 06:35:12 +00:00 
			
		
		
		
	[srmediathek] improve extraction
This commit is contained in:
		| @@ -1,17 +1,18 @@ | ||||
| # encoding: utf-8 | ||||
| from __future__ import unicode_literals | ||||
|  | ||||
| import json | ||||
|  | ||||
| from .common import InfoExtractor | ||||
| from ..utils import js_to_json | ||||
| from .ard import ARDMediathekIE | ||||
| from ..utils import ( | ||||
|     ExtractorError, | ||||
|     get_element_by_attribute, | ||||
| ) | ||||
|  | ||||
|  | ||||
| class SRMediathekIE(InfoExtractor): | ||||
| class SRMediathekIE(ARDMediathekIE): | ||||
|     IE_DESC = 'Saarländischer Rundfunk' | ||||
|     _VALID_URL = r'https?://sr-mediathek\.sr-online\.de/index\.php\?.*?&id=(?P<id>[0-9]+)' | ||||
|  | ||||
|     _TEST = { | ||||
|     _TESTS = [{ | ||||
|         'url': 'http://sr-mediathek.sr-online.de/index.php?seite=7&id=28455', | ||||
|         'info_dict': { | ||||
|             'id': '28455', | ||||
| @@ -20,24 +21,36 @@ class SRMediathekIE(InfoExtractor): | ||||
|             'description': 'Ringen: KSV Köllerbach gegen Aachen-Walheim; Frauen-Fußball: 1. FC Saarbrücken gegen Sindelfingen; Motorsport: Rallye in Losheim; dazu: Interview mit Timo Bernhard; Turnen: TG Saar; Reitsport: Deutscher Voltigier-Pokal; Badminton: Interview mit Michael Fuchs ', | ||||
|             'thumbnail': 're:^https?://.*\.jpg$', | ||||
|         }, | ||||
|     } | ||||
|         'skip': 'no longer available', | ||||
|     }, { | ||||
|         'url': 'http://sr-mediathek.sr-online.de/index.php?seite=7&id=37682', | ||||
|         'info_dict': { | ||||
|             'id': '37682', | ||||
|             'ext': 'mp4', | ||||
|             'title': 'Love, Cakes and Rock\'n\'Roll', | ||||
|             'description': 'md5:18bf9763631c7d326c22603681e1123d', | ||||
|         }, | ||||
|         'params': { | ||||
|             # m3u8 download | ||||
|             'skip_download': True, | ||||
|         }, | ||||
|         'expected_warnings': ['Unable to download f4m manifest'] | ||||
|     }] | ||||
|  | ||||
|     def _real_extract(self, url): | ||||
|         video_id = self._match_id(url) | ||||
|         webpage = self._download_webpage(url, video_id) | ||||
|  | ||||
|         murls = json.loads(js_to_json(self._search_regex( | ||||
|             r'var mediaURLs\s*=\s*(.*?);\n', webpage, 'video URLs'))) | ||||
|         formats = [{'url': murl} for murl in murls] | ||||
|         self._sort_formats(formats) | ||||
|         if '>Der gewünschte Beitrag ist leider nicht mehr verfügbar.<' in webpage: | ||||
|             raise ExtractorError('Video %s is no longer available' % video_id, expected=True) | ||||
|  | ||||
|         title = json.loads(js_to_json(self._search_regex( | ||||
|             r'var mediaTitles\s*=\s*(.*?);\n', webpage, 'title')))[0] | ||||
|  | ||||
|         return { | ||||
|         media_collection_url = self._search_regex( | ||||
|             r'data-mediacollection-ardplayer="([^"]+)"', webpage, 'media collection url') | ||||
|         info = self._extract_media_info(media_collection_url, webpage, video_id) | ||||
|         info.update({ | ||||
|             'id': video_id, | ||||
|             'title': title, | ||||
|             'formats': formats, | ||||
|             'title': get_element_by_attribute('class', 'ardplayer-title', webpage), | ||||
|             'description': self._og_search_description(webpage), | ||||
|             'thumbnail': self._og_search_thumbnail(webpage), | ||||
|         } | ||||
|         }) | ||||
|         return info | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 remitamine
					remitamine