Mirror of https://github.com/yt-dlp/yt-dlp.git (synced 2025-10-31 14:45:14 +00:00)
			
		
		
		
	[teachertube] Fix title and playlist recognition
This commit is contained in:
		| @@ -469,7 +469,7 @@ class InfoExtractor(object): | |||||||
|             display_name = name |             display_name = name | ||||||
|         return self._html_search_regex( |         return self._html_search_regex( | ||||||
|             r'''(?ix)<meta |             r'''(?ix)<meta | ||||||
|                     (?=[^>]+(?:itemprop|name|property)=["\']%s["\']) |                     (?=[^>]+(?:itemprop|name|property)=["\']?%s["\']?) | ||||||
|                     [^>]+content=["\']([^"\']+)["\']''' % re.escape(name), |                     [^>]+content=["\']([^"\']+)["\']''' % re.escape(name), | ||||||
|             html, display_name, fatal=fatal, **kwargs) |             html, display_name, fatal=fatal, **kwargs) | ||||||
|  |  | ||||||
|   | |||||||
| @@ -62,7 +62,7 @@ class TeacherTubeIE(InfoExtractor): | |||||||
|  |  | ||||||
|         webpage = self._download_webpage(url, video_id) |         webpage = self._download_webpage(url, video_id) | ||||||
|  |  | ||||||
|         title = self._html_search_meta('title', webpage, 'title') |         title = self._html_search_meta('title', webpage, 'title', fatal=True) | ||||||
|         TITLE_SUFFIX = ' - TeacherTube' |         TITLE_SUFFIX = ' - TeacherTube' | ||||||
|         if title.endswith(TITLE_SUFFIX): |         if title.endswith(TITLE_SUFFIX): | ||||||
|             title = title[:-len(TITLE_SUFFIX)].strip() |             title = title[:-len(TITLE_SUFFIX)].strip() | ||||||
| @@ -101,7 +101,11 @@ class TeacherTubeUserIE(InfoExtractor): | |||||||
|  |  | ||||||
|     _VALID_URL = r'https?://(?:www\.)?teachertube\.com/(user/profile|collection)/(?P<user>[0-9a-zA-Z]+)/?' |     _VALID_URL = r'https?://(?:www\.)?teachertube\.com/(user/profile|collection)/(?P<user>[0-9a-zA-Z]+)/?' | ||||||
|  |  | ||||||
|     _MEDIA_RE = r'(?s)"sidebar_thumb_time">[0-9:]+</div>.+?<a href="(https?://(?:www\.)?teachertube\.com/(?:video|audio)/[^"]+)">' |     _MEDIA_RE = r'''(?sx) | ||||||
|  |         class="?sidebar_thumb_time"?>[0-9:]+</div> | ||||||
|  |         \s* | ||||||
|  |         <a\s+href="(https?://(?:www\.)?teachertube\.com/(?:video|audio)/[^"]+)" | ||||||
|  |     ''' | ||||||
|  |  | ||||||
|     def _real_extract(self, url): |     def _real_extract(self, url): | ||||||
|         mobj = re.match(self._VALID_URL, url) |         mobj = re.match(self._VALID_URL, url) | ||||||
| @@ -111,14 +115,12 @@ class TeacherTubeUserIE(InfoExtractor): | |||||||
|         webpage = self._download_webpage(url, user_id) |         webpage = self._download_webpage(url, user_id) | ||||||
|         urls.extend(re.findall(self._MEDIA_RE, webpage)) |         urls.extend(re.findall(self._MEDIA_RE, webpage)) | ||||||
|          |          | ||||||
|         pages = re.findall(r'/ajax-user/user-videos/%s\?page=([0-9]+)' % user_id, webpage)[1:-1] |         pages = re.findall(r'/ajax-user/user-videos/%s\?page=([0-9]+)' % user_id, webpage)[:-1] | ||||||
|         for p in pages: |         for p in pages: | ||||||
|             more = 'http://www.teachertube.com/ajax-user/user-videos/%s?page=%s' % (user_id, p) |             more = 'http://www.teachertube.com/ajax-user/user-videos/%s?page=%s' % (user_id, p) | ||||||
|             webpage = self._download_webpage(more, user_id, 'Downloading page %s/%s' % (p, len(pages) + 1)) |             webpage = self._download_webpage(more, user_id, 'Downloading page %s/%s' % (p, len(pages))) | ||||||
|             urls.extend(re.findall(self._MEDIA_RE, webpage)) |             video_urls = re.findall(self._MEDIA_RE, webpage) | ||||||
|  |             urls.extend(video_urls) | ||||||
|         entries = [] |  | ||||||
|         for url in urls: |  | ||||||
|             entries.append(self.url_result(url, 'TeacherTube')) |  | ||||||
|  |  | ||||||
|  |         entries = [self.url_result(vurl, 'TeacherTube') for vurl in urls] | ||||||
|         return self.playlist_result(entries, user_id) |         return self.playlist_result(entries, user_id) | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user
	 Philipp Hagemeister
					Philipp Hagemeister