1
0
mirror of https://github.com/yt-dlp/yt-dlp.git synced 2025-06-27 17:08:32 +00:00
yt-dlp/test/test_jsi_external.py
2025-05-02 03:59:11 -04:00

207 lines
8.5 KiB
Python

#!/usr/bin/env python3
from __future__ import annotations
import os
import dataclasses
import datetime
import time
import sys
import unittest
import http.cookiejar
import functools
import typing
sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
from test.helper import FakeYDL
from yt_dlp.cookies import YoutubeDLCookieJar
from yt_dlp.jsinterp.common import get_included_jsi
from yt_dlp.jsinterp._helper import prepare_wasm_jsmodule
if typing.TYPE_CHECKING:
from yt_dlp.jsinterp.common import JSI
@dataclasses.dataclass
class NetscapeFields:
name: str
value: str
domain: str
path: str
secure: bool
expires: int | None
def to_cookie(self):
return http.cookiejar.Cookie(
0, self.name, self.value,
None, False,
self.domain, True, self.domain.startswith('.'),
self.path, True,
self.secure, self.expires, False,
None, None, {},
)
def expire_str(self):
return datetime.datetime.fromtimestamp(
self.expires, datetime.timezone.utc).strftime('%a, %d %b %Y %H:%M:%S GMT')
def __eq__(self, other: NetscapeFields | http.cookiejar.Cookie):
return all(getattr(self, attr) == getattr(other, attr) for attr in ['name', 'value', 'domain', 'path', 'secure', 'expires'])
def use_jsi_rumtimes(exclude=[]):
def inner(func: typing.Callable[[unittest.TestCase, type[JSI]], None]):
@functools.wraps(func)
def wrapper(self: unittest.TestCase):
for key, jsi in get_included_jsi(exclude=exclude).items():
def wrapped_jsi_with_unavaliable_auto_skip(*args, **kwargs):
if getattr(jsi, 'TEST_DATA_PLUGIN', False):
self.skipTest('Testdata plugin')
instance = jsi(*args, **kwargs)
if not instance.is_available():
self.skipTest(f'{key} is not available')
return instance
with self.subTest(key):
func(self, wrapped_jsi_with_unavaliable_auto_skip)
return wrapper
return inner
class TestExternalJSI(unittest.TestCase):
_TESTDATA_DIR = os.path.join(os.path.dirname(os.path.abspath(__file__)), 'testdata', 'jsi_external')
maxDiff = 2000
def setUp(self):
self.ydl = FakeYDL()
@use_jsi_rumtimes()
def test_execute(self, jsi_cls: type[JSI]):
jsi = jsi_cls(self.ydl, '', 10)
self.assertEqual(jsi.execute('console.log("Hello, world!");'), 'Hello, world!')
@use_jsi_rumtimes()
def test_user_agent(self, jsi_cls: type[JSI]):
ua = self.ydl.params['http_headers']['User-Agent']
jsi = jsi_cls(self.ydl, '', 10)
self.assertEqual(jsi.execute('console.log(navigator.userAgent);'), ua)
self.assertNotEqual(jsi.execute('console.log(JSON.stringify(navigator.webdriver));'), 'true')
jsi = jsi_cls(self.ydl, '', 10, user_agent='test/ua')
self.assertEqual(jsi.execute('console.log(navigator.userAgent);'), 'test/ua')
@use_jsi_rumtimes()
def test_location(self, jsi_cls: type[JSI]):
jsi = jsi_cls(self.ydl, 'https://example.com/123/456', 10)
self.assertEqual(jsi.execute('console.log(JSON.stringify([location.href, location.hostname]));'),
'["https://example.com/123/456","example.com"]')
@use_jsi_rumtimes(exclude=['Deno'])
def test_execute_dom_parse(self, jsi_cls: type[JSI]):
jsi = jsi_cls(self.ydl, '', 10)
self.assertEqual(jsi.execute(
'console.log(document.getElementById("test-div").innerHTML);',
html='<html><body><div id="test-div">Hello, world!</div></body></html>'),
'Hello, world!')
@use_jsi_rumtimes(exclude=['Deno'])
def test_execute_dom_script(self, jsi_cls: type[JSI]):
jsi = jsi_cls(self.ydl, '', 10)
self.assertEqual(jsi.execute(
'console.log(document.getElementById("test-div").innerHTML);',
html='''<html><head><title>Hello, world!</title><body>
<div id="test-div"></div>
<script src="https://example.com/script.js"></script>
<script type="text/javascript">
document.getElementById("test-div").innerHTML = document.title;
console.log('this should not show up');
a = b; // Errors should be ignored
</script>
</body></html>'''),
'Hello, world!')
@use_jsi_rumtimes(exclude=['Deno'])
def test_dom_location(self, jsi_cls: type[JSI]):
jsi = jsi_cls(self.ydl, 'https://example.com/123/456', 10)
self.assertEqual(jsi.execute(
'console.log(document.getElementById("test-div").innerHTML);',
html='''<html><head><script>
document.querySelector("#test-div").innerHTML = document.domain</script></head>
<body><div id="test-div">Hello, world!</div></body></html>'''),
'example.com')
@use_jsi_rumtimes(exclude=['Deno'])
def test_execute_cookiejar(self, jsi_cls: type[JSI]):
cookiejar = YoutubeDLCookieJar()
ref_cookiejar = YoutubeDLCookieJar()
def _assert_expected_execute(cookie_str, ref_cookie_str):
self.assertEqual(set(cookie_str.split('; ')), set(ref_cookie_str.split('; ')))
for cookie in cookiejar:
ref_cookie = next((c for c in ref_cookiejar if c.name == cookie.name
and c.domain == cookie.domain), None)
self.assertEqual(repr(cookie), repr(ref_cookie))
for test_cookie in [
NetscapeFields('test1', 'test1', '.example.com', '/', False, int(time.time()) + 1000),
NetscapeFields('test2', 'test2', '.example.com', '/', True, int(time.time()) + 1000),
NetscapeFields('test3', 'test3', '.example.com', '/123', False, int(time.time()) + 1000),
NetscapeFields('test4', 'test4', '.example.com', '/456', False, int(time.time()) + 1000),
NetscapeFields('test5', 'test5', '.example.com', '/123', True, int(time.time()) + 1000),
NetscapeFields('test6', 'test6', '.example.com', '/456', True, int(time.time()) + 1000),
NetscapeFields('test1', 'other1', '.other.com', '/', False, int(time.time()) + 1000),
NetscapeFields('test2', 'other2', '.other.com', '/', False, int(time.time()) + 1000),
NetscapeFields('test7', 'other7', '.other.com', '/', False, int(time.time()) + 1000),
]:
cookiejar.set_cookie(test_cookie.to_cookie())
ref_cookiejar.set_cookie(test_cookie.to_cookie())
# test identity without modification from js
jsi = jsi_cls(self.ydl, 'http://example.com/123/456', 10)
_assert_expected_execute(jsi.execute(
'console.log(document.cookie);', cookiejar=cookiejar),
'test1=test1; test3=test3')
# test modification of existing cookie from js
new_cookie_1 = NetscapeFields('test1', 'new1', '.example.com', '/', True, int(time.time()) + 900)
new_cookie_2 = NetscapeFields('test2', 'new2', '.example.com', '/', True, int(time.time()) + 900)
ref_cookiejar.set_cookie(new_cookie_1.to_cookie())
ref_cookiejar.set_cookie(new_cookie_2.to_cookie())
# change to https url to test secure-domain behavior
jsi = jsi_cls(self.ydl, 'https://example.com/123/456', 10)
_assert_expected_execute(jsi.execute(
f'''document.cookie = "test1=new1; secure; expires={new_cookie_1.expire_str()}; domain=.example.com; path=/";
console.log(document.cookie);''',
html=f'''<html><body><div id="test-div">Hello, world!</div>
<script>
document.cookie = "test2=new2; secure; expires={new_cookie_2.expire_str()}; domain=.example.com; path=/";
</script>
</body></html>''',
cookiejar=cookiejar),
'test1=new1; test2=new2; test3=test3; test5=test5')
@use_jsi_rumtimes(exclude=['PhantomJS'])
def test_wasm(self, jsi_cls: type[JSI]):
with open(os.path.join(self._TESTDATA_DIR, 'hello_wasm.js')) as f:
js_mod = f.read()
with open(os.path.join(self._TESTDATA_DIR, 'hello_wasm_bg.wasm'), 'rb') as f:
wasm = f.read()
js_base = prepare_wasm_jsmodule(js_mod, wasm)
js_code = js_base + ''';
console.log(add(1, 2));
greet('world');
'''
jsi = jsi_cls(self.ydl, '', 10)
self.assertEqual(jsi.execute(js_code), '3\nHello, world!')
if __name__ == '__main__':
unittest.main()