From 4ffba17e1a750d6be030ee4ea7b9d132f2ca0e74 Mon Sep 17 00:00:00 2001 From: Nikolay Fedorov <40500428+swayll@users.noreply.github.com> Date: Fri, 20 Jun 2025 23:02:43 +0300 Subject: [PATCH] A simpler and more compact way to get embed_url and embed_page at yt_dlp/extractor/thehighwire.py Co-authored-by: doe1080 <98906116+doe1080@users.noreply.github.com> --- yt_dlp/extractor/thehighwire.py | 13 ++++--------- 1 file changed, 4 insertions(+), 9 deletions(-) diff --git a/yt_dlp/extractor/thehighwire.py b/yt_dlp/extractor/thehighwire.py index ffd86f91e..9691910f8 100644 --- a/yt_dlp/extractor/thehighwire.py +++ b/yt_dlp/extractor/thehighwire.py @@ -17,15 +17,10 @@ def _real_extract(self, url): display_id = self._match_id(url) webpage = self._download_webpage(url, display_id) - iframe_url = self._search_regex( - r'<iframe[^>]+src=["\'](https?://app\.arkengine\.com/embed/[^"\']+)', - webpage, 'iframe URL') - video_id = self._search_regex( - r'embed/([a-zA-Z0-9]+)', iframe_url, 'video ID') - - player_page = self._download_webpage( - self._EMBED_URL.format(id=video_id), video_id, - note='Downloading player page') + embed_url = traverse_obj(webpage, ( + {find_element(cls='ark-video-embed', html=True)}, + {extract_attributes}, 'src', {url_or_none}, {require('embed URL')})) + embed_page = self._download_webpage(embed_url, display_id) m3u8_url = self._search_regex( r'<source[^>]+src=["\']([^"\']+\.m3u8)',