diff --git a/yt_dlp/extractor/_extractors.py b/yt_dlp/extractor/_extractors.py
index 34c98b537..56b518793 100644
--- a/yt_dlp/extractor/_extractors.py
+++ b/yt_dlp/extractor/_extractors.py
@@ -570,6 +570,7 @@
     DWIE,
     DWArticleIE,
 )
+from .dzsecurity import DzsecurityLiveIE
 from .eagleplatform import (
     ClipYouEmbedIE,
     EaglePlatformIE,
diff --git a/yt_dlp/extractor/dzsecurity.py b/yt_dlp/extractor/dzsecurity.py
new file mode 100644
index 000000000..21f9b65e6
--- /dev/null
+++ b/yt_dlp/extractor/dzsecurity.py
@@ -0,0 +1,87 @@
+import re
+from urllib.parse import urljoin, urlparse
+
+from .common import InfoExtractor
+from ..utils import ExtractorError
+
+
+class DzsecurityLiveIE(InfoExtractor):
+    """Extract the live streams embedded on echoroukonline.com and ennaharonline.com.
+
+    The live pages of both sites embed a player page hosted on
+    live.dzsecurity.net, and that player page carries the HLS (m3u8) URL.
+    """
+
+    # The ``id`` group is only a display id for log messages; the id that is
+    # returned is read from the embedded player URL.
+    _VALID_URL = r'https?://(?:www\.)?(?:echoroukonline|ennaharonline)\.com/(?P<id>live(?:-news)?)'
+
+    _TESTS = [{
+        'url': 'https://www.echoroukonline.com/live',
+        'info_dict': {
+            'id': 'echorouktv',
+            'title': r're:البث الحي لقناة الشروق تي في \d{4}-\d{2}-\d{2} \d{2}:\d{2}',
+            'ext': 'mp4',
+            'live_status': 'is_live',
+        }
+    }, {
+        'url': 'https://www.echoroukonline.com/live-news',
+        'info_dict': {
+            'id': 'echorouknews',
+            'title': r're:البث الحي لقناة الشروق نيوز - آخر أخبار الجزائر \d{4}-\d{2}-\d{2} \d{2}:\d{2}',
+            'ext': 'mp4',
+            'live_status': 'is_live',
+        }
+    }]
+
+    def _real_extract(self, url):
+        """Return the info dict for the live stream embedded at *url*.
+
+        Raises ExtractorError when the player URL or the m3u8 URL cannot be
+        found in the downloaded pages.
+        """
+        display_id = self._match_id(url)
+        webpage = self._download_webpage(url, display_id)
+
+        title_match = re.search(
+            r'<title\b[^>]*>(.*?)</title>', webpage, re.IGNORECASE | re.DOTALL)
+        # Fall back to a generic title when the tag is missing or empty.
+        title = (title_match.group(1).strip() if title_match else '') or 'Live Stream'
+
+        player_url_match = re.search(
+            r'https://live\.dzsecurity\.net/live/player/([a-zA-Z0-9_-]+)',
+            webpage)
+        if not player_url_match:
+            raise ExtractorError('Player URL not found in the page')
+
+        player_url = player_url_match.group(0)
+        stream_id = player_url_match.group(1)
+
+        # Send the embedding site's origin as Referer when fetching the player
+        # (presumably the player host checks it; not verified here).
+        parsed = urlparse(url)
+        headers = {
+            'Referer': f'{parsed.scheme}://{parsed.netloc}',
+        }
+        player_page = self._download_webpage(player_url, stream_id, headers=headers)
+
+        # The player script sets its source as
+        #     src: location.protocol + "//<host>/<path>.m3u8?<query>"
+        m3u8_match = re.search(
+            r'src:\s*location\.protocol\s*\+\s*"(?P<url>//[^"]+\.m3u8\?[^"]+)"',
+            player_page)
+        if not m3u8_match:
+            raise ExtractorError('M3U8 stream URL not found in player page')
+
+        # ``location.protocol`` is evaluated on the player page, so resolve the
+        # protocol-relative URL against the player URL rather than the site URL.
+        m3u8_url = urljoin(player_url, m3u8_match.group('url'))
+
+        return {
+            'id': stream_id,
+            'title': title,
+            'formats': self._extract_m3u8_formats(
+                m3u8_url, stream_id, ext='mp4', entry_protocol='m3u8',
+                m3u8_id='hls', fatal=True),
+            'is_live': True,
+        }