mirror of
				https://github.com/yt-dlp/yt-dlp.git
				synced 2025-10-31 22:55:18 +00:00 
			
		
		
		
	[extractor/common] Speed-up media tags regex (closes #11979)
This commit is contained in:
		| @@ -1959,7 +1959,12 @@ class InfoExtractor(object): | |||||||
|         media_tags = [(media_tag, media_type, '') |         media_tags = [(media_tag, media_type, '') | ||||||
|                       for media_tag, media_type |                       for media_tag, media_type | ||||||
|                       in re.findall(r'(?s)(<(video|audio)[^>]*/>)', webpage)] |                       in re.findall(r'(?s)(<(video|audio)[^>]*/>)', webpage)] | ||||||
|         media_tags.extend(re.findall(r'(?s)(<(?P<tag>video|audio)[^>]*>)(.*?)</(?P=tag)>', webpage)) |         media_tags.extend(re.findall( | ||||||
|  |             # We only allow video|audio followed by a whitespace or '>'. | ||||||
|  |             # Allowing more characters may result in a significant slowdown (see | ||||||
|  |             # https://github.com/rg3/youtube-dl/issues/11979, example URL: | ||||||
|  |             # http://www.porntrex.com/maps/videositemap.xml). | ||||||
|  |             r'(?s)(<(?P<tag>video|audio)(?:\s+[^>]*)?>)(.*?)</(?P=tag)>', webpage)) | ||||||
|         for media_tag, media_type, media_content in media_tags: |         for media_tag, media_type, media_content in media_tags: | ||||||
|             media_info = { |             media_info = { | ||||||
|                 'formats': [], |                 'formats': [], | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user
	 Sergey M․
					Sergey M․