1
0
mirror of https://github.com/yt-dlp/yt-dlp.git synced 2025-08-18 10:28:29 +00:00

refactor: use api for extraction

This commit is contained in:
JChris246 2025-03-17 22:47:48 -04:00
parent 1dd3d4190d
commit e13730aefa

View File

@ -1,5 +1,11 @@
import random
from .common import InfoExtractor from .common import InfoExtractor
from ..utils import ExtractorError, UserNotLive from ..utils import (
ExtractorError,
UserNotLive,
traverse_obj,
)
class MyFreeCamsIE(InfoExtractor): class MyFreeCamsIE(InfoExtractor):
@ -51,12 +57,12 @@ class MyFreeCamsIE(InfoExtractor):
def get_required_params(self, webpage): def get_required_params(self, webpage):
sid = self._search_regex( sid = self._search_regex(
[r'data-campreview-sid=["\'](\d+)["\']', r'data-cam-preview-server-id-value=["\'](\d+)["\']'], [r'data-campreview-sid=["\'](\d+)["\']', r'data-cam-preview-server-id-value=["\'](\d+)["\']'],
webpage, 'sid', webpage, 'sid', fatal=False
) )
mid = self._search_regex( mid = self._search_regex(
[r'data-campreview-mid=["\'](\d+)["\']', r'data-cam-preview-model-id-value=["\'](\d+)["\']'], [r'data-campreview-mid=["\'](\d+)["\']', r'data-cam-preview-model-id-value=["\'](\d+)["\']'],
webpage, 'mid', webpage, 'mid', fatal=False
) )
webrtc = self._search_regex( webrtc = self._search_regex(
@ -66,19 +72,21 @@ def get_required_params(self, webpage):
snap_url = self._search_regex( snap_url = self._search_regex(
r'data-cam-preview-snap-url-value=["\']([^"\']+)["\']', r'data-cam-preview-snap-url-value=["\']([^"\']+)["\']',
webpage, 'snap_url', webpage, 'snap_url', default=''
) )
webrtc = 'true' if 'mfc_a_' in snap_url else 'false' webrtc = 'true' if 'mfc_a_' in snap_url else 'false'
if not sid or not mid:
return {}
return { return {
'sid': sid, 'sid': sid,
'mid': str(int(mid) + 100_000_000), 'mid': str(int(mid) + 100_000_000),
'a': 'a_' if webrtc == 'true' else '', 'a': 'a_' if webrtc == 'true' else '',
} }
def _real_extract(self, url): def webpage_extraction(self, video_id):
video_id = self._match_id(url)
webpage = self._download_webpage('https://share.myfreecams.com/' + video_id, video_id) webpage = self._download_webpage('https://share.myfreecams.com/' + video_id, video_id)
if not self._search_regex(r'https://www.myfreecams.com/php/tracking.php\?[^\'"]*model_id=(\d+)[^\'"]*', if not self._search_regex(r'https://www.myfreecams.com/php/tracking.php\?[^\'"]*model_id=(\d+)[^\'"]*',
@ -86,7 +94,7 @@ def _real_extract(self, url):
raise ExtractorError('Model not found') raise ExtractorError('Model not found')
params = self.get_required_params(webpage) params = self.get_required_params(webpage)
if not params['sid']: if not params.get('sid'):
raise UserNotLive('Model offline') raise UserNotLive('Model offline')
return { return {
@ -99,3 +107,70 @@ def _real_extract(self, url):
'age_limit': 18, 'age_limit': 18,
'thumbnail': self._search_regex(r'(https?://img\.mfcimg\.com/photos2?/\d+/\d+/avatar\.\d+x\d+.jpg(?:\?nc=\d+)?)', webpage, 'thumbnail', fatal=False), 'thumbnail': self._search_regex(r'(https?://img\.mfcimg\.com/photos2?/\d+/\d+/avatar\.\d+x\d+.jpg(?:\?nc=\d+)?)', webpage, 'thumbnail', fatal=False),
} }
def _real_extract(self, url):
    """Extract the live stream of a model, preferring the JSON API.

    The user record is looked up through the ``usernameLookup`` API and the
    HLS playlist URL is built from the first session that names a server.
    Whenever the API cannot supply usable data (request failure, no
    sessions, no session with a server name, no formats), a warning is
    reported and ``self.webpage_extraction(video_id)`` is used instead.

    Returns:
        An info dict with ``id``, ``title``, ``is_live``, ``formats``,
        ``age_limit`` and ``thumbnail`` (or whatever
        ``webpage_extraction`` returns on the fallback paths).

    Raises:
        UserNotLive: the user record has no ``vs`` value, or the chosen
            session reports ``vstate`` 127.
        ExtractorError: the user is missing, has no id, is not a model
            (``access_level`` other than 4), or the session ``vstate`` is
            anything other than 0 or 90.
    """
    video_id = self._match_id(url)

    # fatal=False: a failed request yields a falsy result instead of raising,
    # which is what makes the webpage fallback below reachable at all.
    user_data = self._download_json(
        'https://api-edge.myfreecams.com/usernameLookup/' + video_id, video_id, fatal=False)
    if not user_data:
        self.report_warning('Unable to get user data from api, falling back to webpage extraction')
        return self.webpage_extraction(video_id)

    # expected_type=dict: anything that is not a mapping is treated as "no user"
    # rather than crashing on the .get() calls below.
    user = traverse_obj(user_data, ('result', 'user'), expected_type=dict)
    if not user:
        raise ExtractorError('Model ' + video_id + ' not found')
    if not user.get('id'):
        raise ExtractorError('Model ' + video_id + ' id not found')
    if user.get('access_level') != 4:
        raise ExtractorError('User ' + video_id + ' is not a model')
    if user.get('vs') is None:
        raise UserNotLive('Model ' + video_id + ' offline', expected=True)

    user_sessions = user.get('sessions')
    if not user_sessions:
        self.report_warning('Unable to get user sessions from api, falling back to webpage extraction')
        return self.webpage_extraction(video_id)

    # Only a session that names its video server can be turned into a stream URL.
    session = next((item for item in user_sessions if item.get('server_name')), None)
    if session is None:
        self.report_warning('Unable to get valid user session from api, falling back to webpage extraction')
        return self.webpage_extraction(video_id)

    # vstate 0 and 90 are the only states extraction proceeds with.
    vs = session.get('vstate')
    if vs == 127:
        raise UserNotLive('Model ' + video_id + ' is offline', expected=True)
    elif vs == 12:
        raise ExtractorError('Model ' + video_id + ' is in a private show', expected=True)
    elif vs == 13:
        raise ExtractorError('Model ' + video_id + ' is in a group show', expected=True)
    elif vs == 2:
        raise ExtractorError('Model ' + video_id + ' is away', expected=True)
    elif vs not in (0, 90):
        raise ExtractorError('Unknown status ' + str(vs) + ' for model ' + video_id)

    # Drops the first five characters of the server name
    # (presumably a fixed textual prefix before the numeric id - TODO confirm).
    server_id = session['server_name'][5:]
    # NOTE(review): a missing 'phase' is interpolated as the text "None" - confirm the API always sends it.
    phase = session.get('phase')
    mid = int(user['id']) + 100_000_000
    rand_val = random.random()

    # fatal=False: a playlist that cannot be fetched/parsed gives an empty list,
    # so the webpage fallback below can run instead of the extraction aborting.
    formats = self._extract_m3u8_formats(
        f'https://edgevideo.myfreecams.com/llhls/NxServer/{server_id}/ngrp:mfc_{phase}{mid}.f4v_cmaf/playlist_sfm4s.m3u8?nc={rand_val}&v=1.97.23',
        video_id, 'mp4', live=True, fatal=False)
    if not formats:
        self.report_warning('Unable to stream urls from api, falling back to webpage extraction')
        return self.webpage_extraction(video_id)

    return {
        'id': video_id,
        'title': video_id,
        'is_live': True,
        'formats': formats,
        'age_limit': 18,
        'thumbnail': user.get('avatar'),
    }