mirror of
				https://github.com/yt-dlp/yt-dlp.git
				synced 2025-10-31 06:35:12 +00:00 
			
		
		
		
	Add support for drtuber.com
This commit is contained in:
		
							
								
								
									
										48
									
								
								youtube_dl/extractor/drtuber.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										48
									
								
								youtube_dl/extractor/drtuber.py
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,48 @@ | ||||
| from __future__ import unicode_literals | ||||
|  | ||||
| import re | ||||
|  | ||||
| from .common import InfoExtractor | ||||
|  | ||||
|  | ||||
class DrTuberIE(InfoExtractor):
    """Extractor for single video pages on drtuber.com.

    Matches URLs of the form ``/video/<numeric id>/<dash-separated title>``
    and scrapes the media URL, title, poster image and keyword list out of
    the page's HTML.
    """

    _VALID_URL = r'https?://(?:www\.)?drtuber\.com/video/(?P<id>\d+)/(?P<title_dash>[\w-]+)'
    _TEST = {
        'url': 'http://www.drtuber.com/video/1740434/hot-perky-blonde-naked-golf',
        'md5': '93e680cf2536ad0dfb7e74d94a89facd',
        'info_dict': {
            'id': '1740434',
            'ext': 'mp4',
            'title': 'Hot Perky Blonde Naked Golf',
            'categories': list,  # NSFW
            # Raw string: same value as before, but without relying on the
            # invalid '\.' escape sequence in a normal string literal.
            'thumbnail': r're:https?://.*\.jpg$',
        }
    }

    def _real_extract(self, url):
        """Download the video page at *url* and build its info dict.

        Returns a dict with the keys ``id``, ``url``, ``title``,
        ``thumbnail`` and ``categories``. The video URL and the title are
        mandatory (their lookups are fatal); ``thumbnail`` and
        ``categories`` are best-effort and are ``None`` when the page does
        not provide them.
        """
        mobj = re.match(self._VALID_URL, url)
        video_id = mobj.group('id')

        webpage = self._download_webpage(url, video_id)

        video_url = self._html_search_regex(
            r'<source src="([^"]+)"', webpage, 'video URL')

        # The page title carries a trailing "- Free ..." suffix that is not
        # part of the video title itself.
        title = self._html_search_regex(
            r'<title>([^<]+)\s*-\s*Free', webpage, 'title')

        thumbnail = self._html_search_regex(
            r'poster="([^"]+)"',
            webpage, 'thumbnail', fatal=False)

        categories_str = self._html_search_regex(
            r'<meta name="keywords" content="([^"]+)"', webpage, 'categories', fatal=False)
        # The lookup above is non-fatal, so it may yield None; splitting
        # unconditionally would crash the whole extraction over an optional
        # field.
        categories = None if categories_str is None else categories_str.split(' ')

        return {
            'id': video_id,
            'url': video_url,
            'title': title,
            'thumbnail': thumbnail,
            'categories': categories,
        }
		Reference in New Issue
	
	Block a user
	 peugeot
					peugeot