mirror of
				https://github.com/yt-dlp/yt-dlp.git
				synced 2025-10-30 22:25:19 +00:00 
			
		
		
		
	[cspan] Make ‘www’ optional and improve the regex for extracting the id (fixes #2194)
This commit is contained in:
		| @@ -10,7 +10,7 @@ from ..utils import ( | ||||
|  | ||||
|  | ||||
| class CSpanIE(InfoExtractor): | ||||
|     _VALID_URL = r'http://www\.c-spanvideo\.org/program/(.*)' | ||||
|     _VALID_URL = r'http://(?:www\.)?c-spanvideo\.org/program/(?P<name>.*)' | ||||
|     IE_DESC = 'C-SPAN' | ||||
|     _TEST = { | ||||
|         'url': 'http://www.c-spanvideo.org/program/HolderonV', | ||||
| @@ -24,9 +24,9 @@ class CSpanIE(InfoExtractor): | ||||
|  | ||||
|     def _real_extract(self, url): | ||||
|         mobj = re.match(self._VALID_URL, url) | ||||
|         prog_name = mobj.group(1) | ||||
|         prog_name = mobj.group('name') | ||||
|         webpage = self._download_webpage(url, prog_name) | ||||
|         video_id = self._search_regex(r'programid=(.*?)&', webpage, 'video id') | ||||
|         video_id = self._search_regex(r'prog(?:ram)?id=(.*?)&', webpage, 'video id') | ||||
|  | ||||
|         title = self._html_search_regex( | ||||
|             r'<!-- title -->\n\s*<h1[^>]*>(.*?)</h1>', webpage, 'title') | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 Jaime Marquínez Ferrándiz
					Jaime Marquínez Ferrándiz