diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
index 4b71a621c..e2411ecfa 100644
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -256,7 +256,7 @@ jobs:
with:
path: |
~/yt-dlp-build-venv
- key: cache-reqs-${{ github.job }}
+ key: cache-reqs-${{ github.job }}-${{ github.ref }}
- name: Install Requirements
run: |
@@ -331,19 +331,16 @@ jobs:
if: steps.restore-cache.outputs.cache-hit == 'true'
env:
GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
- cache_key: cache-reqs-${{ github.job }}
- repository: ${{ github.repository }}
- branch: ${{ github.ref }}
+ cache_key: cache-reqs-${{ github.job }}-${{ github.ref }}
run: |
- gh extension install actions/gh-actions-cache
- gh actions-cache delete "${cache_key}" -R "${repository}" -B "${branch}" --confirm
+ gh cache delete "${cache_key}"
- name: Cache requirements
uses: actions/cache/save@v4
with:
path: |
~/yt-dlp-build-venv
- key: cache-reqs-${{ github.job }}
+ key: cache-reqs-${{ github.job }}-${{ github.ref }}
macos_legacy:
needs: process
diff --git a/.gitignore b/.gitignore
index 8fcd0de64..40bb34d2a 100644
--- a/.gitignore
+++ b/.gitignore
@@ -105,6 +105,8 @@ README.txt
*.zsh
*.spec
test/testdata/sigs/player-*.js
+test/testdata/thumbnails/empty.webp
+test/testdata/thumbnails/foo\ %d\ bar/foo_%d.*
# Binary
/youtube-dl
diff --git a/CONTRIBUTORS b/CONTRIBUTORS
index 5710f9a9e..ea391bc15 100644
--- a/CONTRIBUTORS
+++ b/CONTRIBUTORS
@@ -770,3 +770,12 @@ NeonMan
pj47x
troex
WouterGordts
+baierjan
+GeoffreyFrogeye
+Pawka
+v3DJG6GL
+yozel
+brian6932
+iednod55
+maxbin123
+nullpos
diff --git a/Changelog.md b/Changelog.md
index 513724bf4..dd95abc86 100644
--- a/Changelog.md
+++ b/Changelog.md
@@ -4,6 +4,107 @@ # Changelog
# To create a release, dispatch the https://github.com/yt-dlp/yt-dlp/actions/workflows/release.yml workflow on master
-->
+### 2025.06.09
+
+#### Extractor changes
+- [Improve JSON LD thumbnails extraction](https://github.com/yt-dlp/yt-dlp/commit/85c8a405e3651dc041b758f4744d4fb3c4c55e01) ([#13368](https://github.com/yt-dlp/yt-dlp/issues/13368)) by [bashonly](https://github.com/bashonly), [doe1080](https://github.com/doe1080)
+- **10play**: [Fix extractor](https://github.com/yt-dlp/yt-dlp/commit/6d265388c6e943419ac99e9151cf75a3265f980f) ([#13349](https://github.com/yt-dlp/yt-dlp/issues/13349)) by [bashonly](https://github.com/bashonly)
+- **adobepass**
+ - [Add Fubo MSO](https://github.com/yt-dlp/yt-dlp/commit/eee90acc47d7f8de24afaa8b0271ccaefdf6e88c) ([#13131](https://github.com/yt-dlp/yt-dlp/issues/13131)) by [maxbin123](https://github.com/maxbin123)
+ - [Always add newer user-agent when required](https://github.com/yt-dlp/yt-dlp/commit/0ee1102268cf31b07f8a8318a47424c66b2f7378) ([#13131](https://github.com/yt-dlp/yt-dlp/issues/13131)) by [bashonly](https://github.com/bashonly)
+ - [Fix Philo MSO authentication](https://github.com/yt-dlp/yt-dlp/commit/943083edcd3df45aaa597a6967bc6c95b720f54c) ([#13335](https://github.com/yt-dlp/yt-dlp/issues/13335)) by [Sipherdrakon](https://github.com/Sipherdrakon)
+ - [Rework to require software statement](https://github.com/yt-dlp/yt-dlp/commit/711c5d5d098fee2992a1a624b1c4b30364b91426) ([#13131](https://github.com/yt-dlp/yt-dlp/issues/13131)) by [bashonly](https://github.com/bashonly), [maxbin123](https://github.com/maxbin123)
+ - [Validate login URL before sending credentials](https://github.com/yt-dlp/yt-dlp/commit/89c1b349ad81318d9d3bea76c01c891696e58d38) ([#13131](https://github.com/yt-dlp/yt-dlp/issues/13131)) by [bashonly](https://github.com/bashonly)
+- **aenetworks**
+ - [Fix playlist extractors](https://github.com/yt-dlp/yt-dlp/commit/f37d599a697e82fe68b423865897d55bae34f373) ([#13408](https://github.com/yt-dlp/yt-dlp/issues/13408)) by [Sipherdrakon](https://github.com/Sipherdrakon)
+ - [Fix provider-locked content extraction](https://github.com/yt-dlp/yt-dlp/commit/6693d6603358ae6beca834dbd822a7917498b813) ([#13131](https://github.com/yt-dlp/yt-dlp/issues/13131)) by [maxbin123](https://github.com/maxbin123)
+- **bilibilibangumi**: [Fix extractor](https://github.com/yt-dlp/yt-dlp/commit/13e55162719528d42d2133e16b65ff59a667a6e4) ([#13416](https://github.com/yt-dlp/yt-dlp/issues/13416)) by [c-basalt](https://github.com/c-basalt)
+- **brightcove**: new: [Adapt to new AdobePass requirement](https://github.com/yt-dlp/yt-dlp/commit/98f8eec956e3b16cb66a3d49cc71af3807db795e) ([#13131](https://github.com/yt-dlp/yt-dlp/issues/13131)) by [bashonly](https://github.com/bashonly)
+- **cu.ntv.co.jp**: [Fix extractor](https://github.com/yt-dlp/yt-dlp/commit/aa863ddab9b1d104678e9cf39bb76f5b14fca660) ([#13302](https://github.com/yt-dlp/yt-dlp/issues/13302)) by [doe1080](https://github.com/doe1080), [nullpos](https://github.com/nullpos)
+- **go**: [Fix provider-locked content extraction](https://github.com/yt-dlp/yt-dlp/commit/2e5bf002dad16f5ce35aa2023d392c9e518fcd8f) ([#13131](https://github.com/yt-dlp/yt-dlp/issues/13131)) by [bashonly](https://github.com/bashonly), [maxbin123](https://github.com/maxbin123)
+- **nbc**: [Rework and adapt extractors to new AdobePass flow](https://github.com/yt-dlp/yt-dlp/commit/2d7949d5642bc37d1e71bf00c9a55260e5505d58) ([#13131](https://github.com/yt-dlp/yt-dlp/issues/13131)) by [bashonly](https://github.com/bashonly)
+- **nobelprize**: [Fix extractor](https://github.com/yt-dlp/yt-dlp/commit/97ddfefeb4faba6e61cd80996c16952b8eab16f3) ([#13205](https://github.com/yt-dlp/yt-dlp/issues/13205)) by [doe1080](https://github.com/doe1080)
+- **odnoklassniki**: [Detect and raise when login is required](https://github.com/yt-dlp/yt-dlp/commit/148a1eb4c59e127965396c7a6e6acf1979de459e) ([#13361](https://github.com/yt-dlp/yt-dlp/issues/13361)) by [bashonly](https://github.com/bashonly)
+- **patreon**: [Fix m3u8 formats extraction](https://github.com/yt-dlp/yt-dlp/commit/e0d6c0822930f6e63f574d46d946a58b73ecd10c) ([#13266](https://github.com/yt-dlp/yt-dlp/issues/13266)) by [bashonly](https://github.com/bashonly) (With fixes in [1a8a03e](https://github.com/yt-dlp/yt-dlp/commit/1a8a03ea8d827107319a18076ee3505090667c5a))
+- **podchaser**: [Fix extractor](https://github.com/yt-dlp/yt-dlp/commit/538eb305673c26bff6a2b12f1c96375fe02ce41a) ([#13271](https://github.com/yt-dlp/yt-dlp/issues/13271)) by [bashonly](https://github.com/bashonly)
+- **sr**: mediathek: [Improve metadata extraction](https://github.com/yt-dlp/yt-dlp/commit/e3c605a61f4cc2de9059f37434fa108c3c20f58e) ([#13294](https://github.com/yt-dlp/yt-dlp/issues/13294)) by [doe1080](https://github.com/doe1080)
+- **stacommu**: [Avoid partial stream formats](https://github.com/yt-dlp/yt-dlp/commit/5d96527be80dc1ed1702d9cd548ff86de570ad70) ([#13412](https://github.com/yt-dlp/yt-dlp/issues/13412)) by [bashonly](https://github.com/bashonly)
+- **startrek**: [Fix extractor](https://github.com/yt-dlp/yt-dlp/commit/a8bf0011bde92b3f1324a98bfbd38932fd3ebe18) ([#13188](https://github.com/yt-dlp/yt-dlp/issues/13188)) by [doe1080](https://github.com/doe1080)
+- **svt**: play: [Fix extractor](https://github.com/yt-dlp/yt-dlp/commit/e1b6062f8c4a3fa33c65269d48d09ec78de765a2) ([#13329](https://github.com/yt-dlp/yt-dlp/issues/13329)) by [barsnick](https://github.com/barsnick), [bashonly](https://github.com/bashonly)
+- **telecinco**: [Fix extractor](https://github.com/yt-dlp/yt-dlp/commit/03dba2012d9bd3f402fa8c2f122afba89bbd22a4) ([#13379](https://github.com/yt-dlp/yt-dlp/issues/13379)) by [bashonly](https://github.com/bashonly)
+- **theplatform**: [Improve metadata extraction](https://github.com/yt-dlp/yt-dlp/commit/ed108b3ea481c6a4b5215a9302ba92d74baa2425) ([#13131](https://github.com/yt-dlp/yt-dlp/issues/13131)) by [bashonly](https://github.com/bashonly)
+- **toutiao**: [Add extractor](https://github.com/yt-dlp/yt-dlp/commit/f8051e3a61686c5db1de5f5746366ecfbc3ad20c) ([#13246](https://github.com/yt-dlp/yt-dlp/issues/13246)) by [doe1080](https://github.com/doe1080)
+- **turner**: [Adapt extractors to new AdobePass flow](https://github.com/yt-dlp/yt-dlp/commit/0daddc780d3ac5bebc3a3ec5b884d9243cbc0745) ([#13131](https://github.com/yt-dlp/yt-dlp/issues/13131)) by [bashonly](https://github.com/bashonly)
+- **twitcasting**: [Fix password-protected livestream support](https://github.com/yt-dlp/yt-dlp/commit/52f9729c9a92ad4656d746ff0b1acecb87b3e96d) ([#13097](https://github.com/yt-dlp/yt-dlp/issues/13097)) by [bashonly](https://github.com/bashonly)
+- **twitter**: broadcast: [Support events URLs](https://github.com/yt-dlp/yt-dlp/commit/7794374de8afb20499b023107e2abfd4e6b93ee4) ([#13248](https://github.com/yt-dlp/yt-dlp/issues/13248)) by [doe1080](https://github.com/doe1080)
+- **umg**: de: [Rework extractor](https://github.com/yt-dlp/yt-dlp/commit/4e7c1ea346b510280218b47e8653dbbca3a69870) ([#13373](https://github.com/yt-dlp/yt-dlp/issues/13373)) by [doe1080](https://github.com/doe1080)
+- **vice**: [Mark extractors as broken](https://github.com/yt-dlp/yt-dlp/commit/6121559e027a04574690799c1776bc42bb51af31) ([#13131](https://github.com/yt-dlp/yt-dlp/issues/13131)) by [bashonly](https://github.com/bashonly)
+- **vimeo**: [Extract subtitles from player subdomain](https://github.com/yt-dlp/yt-dlp/commit/c723c4e5e78263df178dbe69844a3d05f3ef9e35) ([#13350](https://github.com/yt-dlp/yt-dlp/issues/13350)) by [bashonly](https://github.com/bashonly)
+- **watchespn**: [Fix provider-locked content extraction](https://github.com/yt-dlp/yt-dlp/commit/b094747e93cfb0a2c53007120e37d0d84d41f030) ([#13131](https://github.com/yt-dlp/yt-dlp/issues/13131)) by [maxbin123](https://github.com/maxbin123)
+- **weverse**: [Support login with oauth refresh tokens](https://github.com/yt-dlp/yt-dlp/commit/3fe72e9eea38d9a58211cde42cfaa577ce020e2c) ([#13284](https://github.com/yt-dlp/yt-dlp/issues/13284)) by [bashonly](https://github.com/bashonly)
+- **youtube**
+ - [Add `tv_simply` player client](https://github.com/yt-dlp/yt-dlp/commit/1fd0e88b67db53ad163393d6965f68e908fa70e3) ([#13389](https://github.com/yt-dlp/yt-dlp/issues/13389)) by [gamer191](https://github.com/gamer191)
+ - [Extract srt subtitles](https://github.com/yt-dlp/yt-dlp/commit/231349786e8c42089c2e079ec94c0ea866c37999) ([#13411](https://github.com/yt-dlp/yt-dlp/issues/13411)) by [gamer191](https://github.com/gamer191)
+ - [Fix `--mark-watched` support](https://github.com/yt-dlp/yt-dlp/commit/b5be29fa58ec98226e11621fd9c58585bcff6879) ([#13222](https://github.com/yt-dlp/yt-dlp/issues/13222)) by [brian6932](https://github.com/brian6932), [iednod55](https://github.com/iednod55)
+ - [Fix automatic captions for some client combinations](https://github.com/yt-dlp/yt-dlp/commit/53ea743a9c158f8ca2d75a09ca44ba68606042d8) ([#13268](https://github.com/yt-dlp/yt-dlp/issues/13268)) by [bashonly](https://github.com/bashonly)
+ - [Improve signature extraction debug output](https://github.com/yt-dlp/yt-dlp/commit/d30a49742cfa22e61c47df4ac0e7334d648fb85d) ([#13327](https://github.com/yt-dlp/yt-dlp/issues/13327)) by [bashonly](https://github.com/bashonly)
+ - [Rework nsig function name extraction](https://github.com/yt-dlp/yt-dlp/commit/9e38b273b7ac942e7e9fc05a651ed810ab7d30ba) ([#13403](https://github.com/yt-dlp/yt-dlp/issues/13403)) by [Grub4K](https://github.com/Grub4K)
+ - [nsig code improvements and cleanup](https://github.com/yt-dlp/yt-dlp/commit/f7bbf5a617f9ab54ef51eaef99be36e175b5e9c3) ([#13280](https://github.com/yt-dlp/yt-dlp/issues/13280)) by [bashonly](https://github.com/bashonly)
+- **zdf**: [Fix language extraction and format sorting](https://github.com/yt-dlp/yt-dlp/commit/db162b76f6bdece50babe2e0cacfe56888c2e125) ([#13313](https://github.com/yt-dlp/yt-dlp/issues/13313)) by [InvalidUsernameException](https://github.com/InvalidUsernameException)
+
+#### Misc. changes
+- **build**
+ - [Exclude `pkg_resources` from being collected](https://github.com/yt-dlp/yt-dlp/commit/cc749a8a3b8b6e5c05318868c72a403f376a1b38) ([#13320](https://github.com/yt-dlp/yt-dlp/issues/13320)) by [bashonly](https://github.com/bashonly)
+ - [Fix macOS requirements caching](https://github.com/yt-dlp/yt-dlp/commit/201812100f315c6727a4418698d5b4e8a79863d4) ([#13328](https://github.com/yt-dlp/yt-dlp/issues/13328)) by [bashonly](https://github.com/bashonly)
+- **cleanup**: Miscellaneous: [339614a](https://github.com/yt-dlp/yt-dlp/commit/339614a173c74b42d63e858c446a9cae262a13af) by [bashonly](https://github.com/bashonly)
+- **test**: postprocessors: [Remove binary thumbnail test data](https://github.com/yt-dlp/yt-dlp/commit/a9b370069838e84d44ac7ad095d657003665885a) ([#13341](https://github.com/yt-dlp/yt-dlp/issues/13341)) by [bashonly](https://github.com/bashonly)
+
+### 2025.05.22
+
+#### Core changes
+- **cookies**: [Fix Linux desktop environment detection](https://github.com/yt-dlp/yt-dlp/commit/e491fd4d090db3af52a82863fb0553dd5e17fb85) ([#13197](https://github.com/yt-dlp/yt-dlp/issues/13197)) by [mbway](https://github.com/mbway)
+- **jsinterp**: [Fix increment/decrement evaluation](https://github.com/yt-dlp/yt-dlp/commit/167d7a9f0ffd1b4fe600193441bdb7358db2740b) ([#13238](https://github.com/yt-dlp/yt-dlp/issues/13238)) by [bashonly](https://github.com/bashonly), [seproDev](https://github.com/seproDev)
+
+#### Extractor changes
+- **1tv**: [Fix extractor](https://github.com/yt-dlp/yt-dlp/commit/41c0a1fb89628696f8bb88e2b9f3a68f355b8c26) ([#13168](https://github.com/yt-dlp/yt-dlp/issues/13168)) by [bashonly](https://github.com/bashonly)
+- **amcnetworks**: [Fix extractor](https://github.com/yt-dlp/yt-dlp/commit/464c84fedf78eef822a431361155f108b5df96d7) ([#13147](https://github.com/yt-dlp/yt-dlp/issues/13147)) by [bashonly](https://github.com/bashonly)
+- **bitchute**: [Fix extractor](https://github.com/yt-dlp/yt-dlp/commit/1d0f6539c47e5d5c68c3c47cdb7075339e2885ac) ([#13081](https://github.com/yt-dlp/yt-dlp/issues/13081)) by [bashonly](https://github.com/bashonly)
+- **cartoonnetwork**: [Remove extractor](https://github.com/yt-dlp/yt-dlp/commit/7dbb47f84f0ee1266a3a01f58c9bc4c76d76794a) ([#13148](https://github.com/yt-dlp/yt-dlp/issues/13148)) by [bashonly](https://github.com/bashonly)
+- **iprima**: [Fix login support](https://github.com/yt-dlp/yt-dlp/commit/a7d9a5eb79ceeecb851389f3f2c88597871ca3f2) ([#12937](https://github.com/yt-dlp/yt-dlp/issues/12937)) by [baierjan](https://github.com/baierjan)
+- **jiosaavn**
+ - artist: [Add extractor](https://github.com/yt-dlp/yt-dlp/commit/586b557b124f954d3f625360ebe970989022ad97) ([#12803](https://github.com/yt-dlp/yt-dlp/issues/12803)) by [subrat-lima](https://github.com/subrat-lima)
+ - playlist, show: [Add extractor](https://github.com/yt-dlp/yt-dlp/commit/317f4b8006c2c0f0f64f095b1485163ad97c9053) ([#12803](https://github.com/yt-dlp/yt-dlp/issues/12803)) by [subrat-lima](https://github.com/subrat-lima)
+ - show: [Add extractor](https://github.com/yt-dlp/yt-dlp/commit/6839276496d8814cf16f58b637e45663467928e6) ([#12803](https://github.com/yt-dlp/yt-dlp/issues/12803)) by [subrat-lima](https://github.com/subrat-lima)
+- **lrtradio**: [Fix extractor](https://github.com/yt-dlp/yt-dlp/commit/abf58dcd6a09e14eec4ea82ae12f79a0337cb383) ([#13200](https://github.com/yt-dlp/yt-dlp/issues/13200)) by [Pawka](https://github.com/Pawka)
+- **nebula**: [Support `--mark-watched`](https://github.com/yt-dlp/yt-dlp/commit/20f288bdc2173c7cc58d709d25ca193c1f6001e7) ([#13120](https://github.com/yt-dlp/yt-dlp/issues/13120)) by [GeoffreyFrogeye](https://github.com/GeoffreyFrogeye)
+- **niconico**
+ - [Fix error handling](https://github.com/yt-dlp/yt-dlp/commit/f569be4602c2a857087e495d5d7ed6060cd97abe) ([#13236](https://github.com/yt-dlp/yt-dlp/issues/13236)) by [bashonly](https://github.com/bashonly)
+ - live: [Fix extractor](https://github.com/yt-dlp/yt-dlp/commit/7a7b85c9014d96421e18aa7ea5f4c1bee5ceece0) ([#13045](https://github.com/yt-dlp/yt-dlp/issues/13045)) by [doe1080](https://github.com/doe1080)
+- **nytimesarticle**: [Fix extraction](https://github.com/yt-dlp/yt-dlp/commit/b26bc32579c00ef579d75a835807ccc87d20ee0a) ([#13104](https://github.com/yt-dlp/yt-dlp/issues/13104)) by [bashonly](https://github.com/bashonly)
+- **once**: [Remove extractor](https://github.com/yt-dlp/yt-dlp/commit/f475e8b529d18efdad603ffda02a56e707fe0e2c) ([#13164](https://github.com/yt-dlp/yt-dlp/issues/13164)) by [bashonly](https://github.com/bashonly)
+- **picarto**: vod: [Support `/profile/` video URLs](https://github.com/yt-dlp/yt-dlp/commit/31e090cb787f3504ec25485adff9a2a51d056734) ([#13227](https://github.com/yt-dlp/yt-dlp/issues/13227)) by [subrat-lima](https://github.com/subrat-lima)
+- **playsuisse**: [Improve metadata extraction](https://github.com/yt-dlp/yt-dlp/commit/d880e060803ae8ed5a047e578cca01e1f0e630ce) ([#12466](https://github.com/yt-dlp/yt-dlp/issues/12466)) by [v3DJG6GL](https://github.com/v3DJG6GL)
+- **sprout**: [Remove extractor](https://github.com/yt-dlp/yt-dlp/commit/cbcfe6378dde33a650e3852ab17ad4503b8e008d) ([#13149](https://github.com/yt-dlp/yt-dlp/issues/13149)) by [bashonly](https://github.com/bashonly)
+- **svtpage**: [Fix extractor](https://github.com/yt-dlp/yt-dlp/commit/ea8498ed534642dd7e925961b97b934987142fd3) ([#12957](https://github.com/yt-dlp/yt-dlp/issues/12957)) by [diman8](https://github.com/diman8)
+- **twitch**: [Support `--live-from-start`](https://github.com/yt-dlp/yt-dlp/commit/00b1bec55249cf2ad6271d36492c51b34b6459d1) ([#13202](https://github.com/yt-dlp/yt-dlp/issues/13202)) by [bashonly](https://github.com/bashonly)
+- **vimeo**: event: [Add extractor](https://github.com/yt-dlp/yt-dlp/commit/545c1a5b6f2fe88722b41aef0e7485bf3be3f3f9) ([#13216](https://github.com/yt-dlp/yt-dlp/issues/13216)) by [bashonly](https://github.com/bashonly)
+- **wat.tv**: [Improve error handling](https://github.com/yt-dlp/yt-dlp/commit/f123cc83b3aea45053f5fa1d9141048b01fc2774) ([#13111](https://github.com/yt-dlp/yt-dlp/issues/13111)) by [bashonly](https://github.com/bashonly)
+- **weverse**: [Fix live extraction](https://github.com/yt-dlp/yt-dlp/commit/5328eda8820cc5f21dcf917684d23fbdca41831d) ([#13084](https://github.com/yt-dlp/yt-dlp/issues/13084)) by [bashonly](https://github.com/bashonly)
+- **xinpianchang**: [Fix extractor](https://github.com/yt-dlp/yt-dlp/commit/83fabf352489d52843f67e6e9cc752db86d27e6e) ([#13245](https://github.com/yt-dlp/yt-dlp/issues/13245)) by [garret1317](https://github.com/garret1317)
+- **youtube**
+ - [Add PO token support for subtitles](https://github.com/yt-dlp/yt-dlp/commit/32ed5f107c6c641958d1cd2752e130de4db55a13) ([#13234](https://github.com/yt-dlp/yt-dlp/issues/13234)) by [bashonly](https://github.com/bashonly), [coletdjnz](https://github.com/coletdjnz)
+ - [Add `web_embedded` client for age-restricted videos](https://github.com/yt-dlp/yt-dlp/commit/0feec6dc131f488428bf881519e7c69766fbb9ae) ([#13089](https://github.com/yt-dlp/yt-dlp/issues/13089)) by [bashonly](https://github.com/bashonly)
+ - [Add a PO Token Provider Framework](https://github.com/yt-dlp/yt-dlp/commit/2685654a37141cca63eda3a92da0e2706e23ccfd) ([#12840](https://github.com/yt-dlp/yt-dlp/issues/12840)) by [coletdjnz](https://github.com/coletdjnz)
+ - [Extract `media_type` for all videos](https://github.com/yt-dlp/yt-dlp/commit/ded11ebc9afba6ba33923375103e9be2d7c804e7) ([#13136](https://github.com/yt-dlp/yt-dlp/issues/13136)) by [bashonly](https://github.com/bashonly)
+ - [Fix `--live-from-start` support for premieres](https://github.com/yt-dlp/yt-dlp/commit/8f303afb43395be360cafd7ad4ce2b6e2eedfb8a) ([#13079](https://github.com/yt-dlp/yt-dlp/issues/13079)) by [arabcoders](https://github.com/arabcoders)
+ - [Fix geo-restriction error handling](https://github.com/yt-dlp/yt-dlp/commit/c7e575e31608c19c5b26c10a4229db89db5fc9a8) ([#13217](https://github.com/yt-dlp/yt-dlp/issues/13217)) by [yozel](https://github.com/yozel)
+
+#### Misc. changes
+- **build**
+ - [Bump PyInstaller to v6.13.0](https://github.com/yt-dlp/yt-dlp/commit/17cf9088d0d535e4a7feffbf02bd49cd9dae5ab9) ([#13082](https://github.com/yt-dlp/yt-dlp/issues/13082)) by [bashonly](https://github.com/bashonly)
+ - [Bump run-on-arch-action to v3](https://github.com/yt-dlp/yt-dlp/commit/9064d2482d1fe722bbb4a49731fe0711c410d1c8) ([#13088](https://github.com/yt-dlp/yt-dlp/issues/13088)) by [bashonly](https://github.com/bashonly)
+- **cleanup**: Miscellaneous: [7977b32](https://github.com/yt-dlp/yt-dlp/commit/7977b329ed97b216e37bd402f4935f28c00eac9e) by [bashonly](https://github.com/bashonly)
+
### 2025.04.30
#### Important changes
diff --git a/Makefile b/Makefile
index 6c72ead1e..273cb3cc0 100644
--- a/Makefile
+++ b/Makefile
@@ -18,10 +18,11 @@ pypi-files: AUTHORS Changelog.md LICENSE README.md README.txt supportedsites \
tar pypi-files lazy-extractors install uninstall
clean-test:
- rm -rf test/testdata/sigs/player-*.js tmp/ *.annotations.xml *.aria2 *.description *.dump *.frag \
+ rm -rf tmp/ *.annotations.xml *.aria2 *.description *.dump *.frag \
*.frag.aria2 *.frag.urls *.info.json *.live_chat.json *.meta *.part* *.tmp *.temp *.unknown_video *.ytdl \
*.3gp *.ape *.ass *.avi *.desktop *.f4v *.flac *.flv *.gif *.jpeg *.jpg *.lrc *.m4a *.m4v *.mhtml *.mkv *.mov *.mp3 *.mp4 \
- *.mpg *.mpga *.oga *.ogg *.opus *.png *.sbv *.srt *.ssa *.swf *.tt *.ttml *.url *.vtt *.wav *.webloc *.webm *.webp
+ *.mpg *.mpga *.oga *.ogg *.opus *.png *.sbv *.srt *.ssa *.swf *.tt *.ttml *.url *.vtt *.wav *.webloc *.webm *.webp \
+ test/testdata/sigs/player-*.js test/testdata/thumbnails/empty.webp "test/testdata/thumbnails/foo %d bar/foo_%d."*
clean-dist:
rm -rf yt-dlp.1.temp.md yt-dlp.1 README.txt MANIFEST build/ dist/ .coverage cover/ yt-dlp.tar.gz completions/ \
yt_dlp/extractor/lazy_extractors.py *.spec CONTRIBUTING.md.tmp yt-dlp yt-dlp.exe yt_dlp.egg-info/ AUTHORS
diff --git a/README.md b/README.md
index db6504a07..8d7f021c2 100644
--- a/README.md
+++ b/README.md
@@ -44,6 +44,7 @@
* [Post-processing Options](#post-processing-options)
* [SponsorBlock Options](#sponsorblock-options)
* [Extractor Options](#extractor-options)
+ * [Preset Aliases](#preset-aliases)
* [CONFIGURATION](#configuration)
* [Configuration file encoding](#configuration-file-encoding)
* [Authentication with netrc](#authentication-with-netrc)
@@ -348,8 +349,8 @@ ## General Options:
--no-flat-playlist Fully extract the videos of a playlist
(default)
--live-from-start Download livestreams from the start.
- Currently only supported for YouTube
- (Experimental)
+ Currently experimental and only supported
+ for YouTube and Twitch
--no-live-from-start Download livestreams from the current time
(default)
--wait-for-video MIN[-MAX][:RETRIES]
@@ -379,12 +380,12 @@ ## General Options:
an alias starts with a dash "-", it is
prefixed with "--". Arguments are parsed
according to the Python string formatting
- mini-language. E.g. --alias get-audio,-X
- "-S=aext:{0},abr -x --audio-format {0}"
- creates options "--get-audio" and "-X" that
- takes an argument (ARG0) and expands to
- "-S=aext:ARG0,abr -x --audio-format ARG0".
- All defined aliases are listed in the --help
+ mini-language. E.g. --alias get-audio,-X "-S
+ aext:{0},abr -x --audio-format {0}" creates
+ options "--get-audio" and "-X" that takes an
+ argument (ARG0) and expands to "-S
+ aext:ARG0,abr -x --audio-format ARG0". All
+ defined aliases are listed in the --help
output. Alias options can trigger more
aliases; so be careful to avoid defining
recursive options. As a safety measure, each
@@ -1109,6 +1110,10 @@ ## Extractor Options:
arguments for different extractors
## Preset Aliases:
+Predefined aliases for convenience and ease of use. Note that future
+ versions of yt-dlp may add or adjust presets, but the existing preset
+ names will not be changed or removed
+
-t mp3 -f 'ba[acodec^=mp3]/ba/b' -x --audio-format
mp3
@@ -1794,11 +1799,12 @@ # EXTRACTOR ARGUMENTS
The following extractors use this feature:
#### youtube
-* `lang`: Prefer translated metadata (`title`, `description` etc) of this language code (case-sensitive). By default, the video primary language metadata is preferred, with a fallback to `en` translated. See [youtube.py](https://github.com/yt-dlp/yt-dlp/blob/c26f9b991a0681fd3ea548d535919cec1fbbd430/yt_dlp/extractor/youtube.py#L381-L390) for list of supported content language codes
+* `lang`: Prefer translated metadata (`title`, `description` etc) of this language code (case-sensitive). By default, the video primary language metadata is preferred, with a fallback to `en` translated. See [youtube/_base.py](https://github.com/yt-dlp/yt-dlp/blob/415b4c9f955b1a0391204bd24a7132590e7b3bdb/yt_dlp/extractor/youtube/_base.py#L402-L409) for the list of supported content language codes
* `skip`: One or more of `hls`, `dash` or `translated_subs` to skip extraction of the m3u8 manifests, dash manifests and [auto-translated subtitles](https://github.com/yt-dlp/yt-dlp/issues/4090#issuecomment-1158102032) respectively
-* `player_client`: Clients to extract video data from. The currently available clients are `web`, `web_safari`, `web_embedded`, `web_music`, `web_creator`, `mweb`, `ios`, `android`, `android_vr`, `tv` and `tv_embedded`. By default, `tv,ios,web` is used, or `tv,web` is used when authenticating with cookies. The `web_music` client is added for `music.youtube.com` URLs when logged-in cookies are used. The `web_embedded` client is added for age-restricted videos but only works if the video is embeddable. The `tv_embedded` and `web_creator` clients are added for age-restricted videos if account age-verification is required. Some clients, such as `web` and `web_music`, require a `po_token` for their formats to be downloadable. Some clients, such as `web_creator`, will only work with authentication. Not all clients support authentication via cookies. You can use `default` for the default clients, or you can use `all` for all clients (not recommended). You can prefix a client with `-` to exclude it, e.g. `youtube:player_client=default,-ios`
+* `player_client`: Clients to extract video data from. The currently available clients are `web`, `web_safari`, `web_embedded`, `web_music`, `web_creator`, `mweb`, `ios`, `android`, `android_vr`, `tv`, `tv_simply` and `tv_embedded`. By default, `tv,ios,web` is used, or `tv,web` is used when authenticating with cookies. The `web_music` client is added for `music.youtube.com` URLs when logged-in cookies are used. The `web_embedded` client is added for age-restricted videos but only works if the video is embeddable. The `tv_embedded` and `web_creator` clients are added for age-restricted videos if account age-verification is required. Some clients, such as `web` and `web_music`, require a `po_token` for their formats to be downloadable. Some clients, such as `web_creator`, will only work with authentication. Not all clients support authentication via cookies. You can use `default` for the default clients, or you can use `all` for all clients (not recommended). You can prefix a client with `-` to exclude it, e.g. `youtube:player_client=default,-ios`
* `player_skip`: Skip some network requests that are generally needed for robust extraction. One or more of `configs` (skip client configs), `webpage` (skip initial webpage), `js` (skip js player), `initial_data` (skip initial data/next ep request). While these options can help reduce the number of requests needed or avoid some rate-limiting, they could cause issues such as missing formats or metadata. See [#860](https://github.com/yt-dlp/yt-dlp/pull/860) and [#12826](https://github.com/yt-dlp/yt-dlp/issues/12826) for more details
* `player_params`: YouTube player parameters to use for player requests. Will overwrite any default ones set by yt-dlp.
+* `player_js_variant`: The player javascript variant to use for signature and nsig deciphering. The known variants are: `main`, `tce`, `tv`, `tv_es6`, `phone`, `tablet`. Only `main` is recommended as a possible workaround; the others are for debugging purposes. The default is to use what is prescribed by the site, and can be selected with `actual`
* `comment_sort`: `top` or `new` (default) - choose comment sorting mode (on YouTube's side)
* `max_comments`: Limit the amount of comments to gather. Comma-separated list of integers representing `max-comments,max-parents,max-replies,max-replies-per-thread`. Default is `all,all,all,all`
* E.g. `all,all,1000,10` will get a maximum of 1000 replies total, with up to 10 replies per thread. `1000,all,100` will get a maximum of 1000 comments, with a maximum of 100 replies total
@@ -1808,8 +1814,12 @@ #### youtube
* `raise_incomplete_data`: `Incomplete Data Received` raises an error instead of reporting a warning
* `data_sync_id`: Overrides the account Data Sync ID used in Innertube API requests. This may be needed if you are using an account with `youtube:player_skip=webpage,configs` or `youtubetab:skip=webpage`
* `visitor_data`: Overrides the Visitor Data used in Innertube API requests. This should be used with `player_skip=webpage,configs` and without cookies. Note: this may have adverse effects if used improperly. If a session from a browser is wanted, you should pass cookies instead (which contain the Visitor ID)
-* `po_token`: Proof of Origin (PO) Token(s) to use. Comma seperated list of PO Tokens in the format `CLIENT.CONTEXT+PO_TOKEN`, e.g. `youtube:po_token=web.gvs+XXX,web.player=XXX,web_safari.gvs+YYY`. Context can be either `gvs` (Google Video Server URLs) or `player` (Innertube player request)
-* `player_js_variant`: The player javascript variant to use for signature and nsig deciphering. The known variants are: `main`, `tce`, `tv`, `tv_es6`, `phone`, `tablet`. Only `main` is recommended as a possible workaround; the others are for debugging purposes. The default is to use what is prescribed by the site, and can be selected with `actual`
+* `po_token`: Proof of Origin (PO) Token(s) to use. Comma-separated list of PO Tokens in the format `CLIENT.CONTEXT+PO_TOKEN`, e.g. `youtube:po_token=web.gvs+XXX,web.player+XXX,web_safari.gvs+YYY`. Context can be any of `gvs` (Google Video Server URLs), `player` (Innertube player request) or `subs` (Subtitles)
+* `pot_trace`: Enable debug logging for PO Token fetching. Either `true` or `false` (default)
+* `fetch_pot`: Policy to use for fetching a PO Token from providers. One of `always` (always try to fetch a PO Token regardless of whether the client requires one for the given context), `never` (never fetch a PO Token), or `auto` (default; only fetch a PO Token if the client requires one for the given context)
+
+#### youtubepot-webpo
+* `bind_to_visitor_id`: Whether to use the Visitor ID instead of Visitor Data for caching WebPO tokens. Either `true` (default) or `false`
#### youtubetab (YouTube playlists, channels, feeds, etc.)
* `skip`: One or more of `webpage` (skip initial webpage download), `authcheck` (allow the download of playlists requiring authentication when no initial webpage is downloaded. This may cause unwanted behavior, see [#1122](https://github.com/yt-dlp/yt-dlp/pull/1122) for more details)
diff --git a/bundle/docker/static/entrypoint.sh b/bundle/docker/static/entrypoint.sh
index 220275974..8049e6820 100755
--- a/bundle/docker/static/entrypoint.sh
+++ b/bundle/docker/static/entrypoint.sh
@@ -2,6 +2,7 @@
set -e
source ~/.local/share/pipx/venvs/pyinstaller/bin/activate
+python -m devscripts.install_deps -o --include build
python -m devscripts.install_deps --include secretstorage --include curl-cffi
python -m devscripts.make_lazy_extractors
python devscripts/update-version.py -c "${channel}" -r "${origin}" "${version}"
diff --git a/bundle/pyinstaller.py b/bundle/pyinstaller.py
index 4184c4bc9..c2f651121 100755
--- a/bundle/pyinstaller.py
+++ b/bundle/pyinstaller.py
@@ -36,6 +36,9 @@ def main():
f'--name={name}',
'--icon=devscripts/logo.ico',
'--upx-exclude=vcruntime140.dll',
+ # Ref: https://github.com/yt-dlp/yt-dlp/issues/13311
+ # https://github.com/pyinstaller/pyinstaller/issues/9149
+ '--exclude-module=pkg_resources',
'--noconfirm',
'--additional-hooks-dir=yt_dlp/__pyinstaller',
*opts,
diff --git a/pyproject.toml b/pyproject.toml
index 7accaeeb9..3775251e1 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -65,7 +65,7 @@ build = [
"build",
"hatchling",
"pip",
- "setuptools>=71.0.2", # 71.0.0 broke pyinstaller
+ "setuptools>=71.0.2,<81", # See https://github.com/pyinstaller/pyinstaller/issues/9149
"wheel",
]
dev = [
diff --git a/supportedsites.md b/supportedsites.md
index 03bd8a7c3..1fe381603 100644
--- a/supportedsites.md
+++ b/supportedsites.md
@@ -5,6 +5,8 @@ # Supported sites
Not all sites listed here are guaranteed to work; websites are constantly changing and sometimes this breaks yt-dlp's support for them.
The only reliable way to check if a site is supported is to try it.
+ - **10play**: [*10play*](## "netrc machine")
+ - **10play:season**
- **17live**
- **17live:clip**
- **17live:vod**
@@ -246,7 +248,6 @@ # Supported sites
- **Canalplus**: mycanal.fr and piwiplus.fr
- **Canalsurmas**
- **CaracolTvPlay**: [*caracoltv-play*](## "netrc machine")
- - **CartoonNetwork**
- **cbc.ca**
- **cbc.ca:player**
- **cbc.ca:player:playlist**
@@ -296,7 +297,7 @@ # Supported sites
- **CNNIndonesia**
- **ComedyCentral**
- **ComedyCentralTV**
- - **ConanClassic**
+ - **ConanClassic**: (**Currently broken**)
- **CondeNast**: Condé Nast media group: Allure, Architectural Digest, Ars Technica, Bon Appétit, Brides, Condé Nast, Condé Nast Traveler, Details, Epicurious, GQ, Glamour, Golf Digest, SELF, Teen Vogue, The New Yorker, Vanity Fair, Vogue, W Magazine, WIRED
- **CONtv**
- **CookingChannel**
@@ -318,7 +319,7 @@ # Supported sites
- **CtsNews**: 華視新聞
- **CTV**
- **CTVNews**
- - **cu.ntv.co.jp**: Nippon Television Network
+ - **cu.ntv.co.jp**: 日テレ無料TADA!
- **CultureUnplugged**
- **curiositystream**: [*curiositystream*](## "netrc machine")
- **curiositystream:collections**: [*curiositystream*](## "netrc machine")
@@ -649,7 +650,10 @@ # Supported sites
- **jiocinema**: [*jiocinema*](## "netrc machine")
- **jiocinema:series**: [*jiocinema*](## "netrc machine")
- **jiosaavn:album**
+ - **jiosaavn:artist**
- **jiosaavn:playlist**
+ - **jiosaavn:show**
+ - **jiosaavn:show:playlist**
- **jiosaavn:song**
- **Joj**
- **JoqrAg**: 超!A&G+ 文化放送 (f.k.a. AGQR) Nippon Cultural Broadcasting, Inc. (JOQR)
@@ -880,19 +884,19 @@ # Supported sites
- **Naver**
- **Naver:live**
- **navernow**
- - **nba**
- - **nba:channel**
- - **nba:embed**
- - **nba:watch**
- - **nba:watch:collection**
- - **nba:watch:embed**
+ - **nba**: (**Currently broken**)
+ - **nba:channel**: (**Currently broken**)
+ - **nba:embed**: (**Currently broken**)
+ - **nba:watch**: (**Currently broken**)
+ - **nba:watch:collection**: (**Currently broken**)
+ - **nba:watch:embed**: (**Currently broken**)
- **NBC**
- **NBCNews**
- **nbcolympics**
- - **nbcolympics:stream**
- - **NBCSports**
- - **NBCSportsStream**
- - **NBCSportsVPlayer**
+ - **nbcolympics:stream**: (**Currently broken**)
+ - **NBCSports**: (**Currently broken**)
+ - **NBCSportsStream**: (**Currently broken**)
+ - **NBCSportsVPlayer**: (**Currently broken**)
- **NBCStations**
- **ndr**: NDR.de - Norddeutscher Rundfunk
- **ndr:embed**
@@ -968,7 +972,7 @@ # Supported sites
- **Nitter**
- **njoy**: N-JOY
- **njoy:embed**
- - **NobelPrize**: (**Currently broken**)
+ - **NobelPrize**
- **NoicePodcast**
- **NonkTube**
- **NoodleMagazine**
@@ -1081,8 +1085,8 @@ # Supported sites
- **Photobucket**
- **PiaLive**
- **Piapro**: [*piapro*](## "netrc machine")
- - **Picarto**
- - **PicartoVod**
+ - **picarto**
+ - **picarto:vod**
- **Piksel**
- **Pinkbike**
- **Pinterest**
@@ -1390,16 +1394,15 @@ # Supported sites
- **Spreaker**
- **SpreakerShow**
- **SpringboardPlatform**
- - **Sprout**
- **SproutVideo**
- - **sr:mediathek**: Saarländischer Rundfunk (**Currently broken**)
+ - **sr:mediathek**: Saarländischer Rundfunk
- **SRGSSR**
- **SRGSSRPlay**: srf.ch, rts.ch, rsi.ch, rtr.ch and swissinfo.ch play sites
- **StacommuLive**: [*stacommu*](## "netrc machine")
- **StacommuVOD**: [*stacommu*](## "netrc machine")
- **StagePlusVODConcert**: [*stageplus*](## "netrc machine")
- **stanfordoc**: Stanford Open ClassRoom
- - **StarTrek**: (**Currently broken**)
+ - **startrek**: STAR TREK
- **startv**
- **Steam**
- **SteamCommunityBroadcast**
@@ -1422,12 +1425,11 @@ # Supported sites
- **SunPorno**
- **sverigesradio:episode**
- **sverigesradio:publication**
- - **SVT**
- - **SVTPage**
- - **SVTPlay**: SVT Play and Öppet arkiv
- - **SVTSeries**
+ - **svt:page**
+ - **svt:play**: SVT Play and Öppet arkiv
+ - **svt:play:series**
- **SwearnetEpisode**
- - **Syfy**: (**Currently broken**)
+ - **Syfy**
- **SYVDK**
- **SztvHu**
- **t-online.de**: (**Currently broken**)
@@ -1471,8 +1473,6 @@ # Supported sites
- **Telewebion**: (**Currently broken**)
- **Tempo**
- **TennisTV**: [*tennistv*](## "netrc machine")
- - **TenPlay**: [*10play*](## "netrc machine")
- - **TenPlaySeason**
- **TF1**
- **TFO**
- **theatercomplextown:ppv**: [*theatercomplextown*](## "netrc machine")
@@ -1510,6 +1510,7 @@ # Supported sites
- **tokfm:podcast**
- **ToonGoggles**
- **tou.tv**: [*toutv*](## "netrc machine")
+ - **toutiao**: 今日头条
- **Toypics**: Toypics video (**Currently broken**)
- **ToypicsUser**: Toypics user profile (**Currently broken**)
- **TrailerAddict**: (**Currently broken**)
@@ -1599,7 +1600,7 @@ # Supported sites
- **UKTVPlay**
- **UlizaPlayer**
- **UlizaPortal**: ulizaportal.jp
- - **umg:de**: Universal Music Deutschland (**Currently broken**)
+ - **umg:de**: Universal Music Deutschland
- **Unistra**
- **Unity**: (**Currently broken**)
- **uol.com.br**
@@ -1622,9 +1623,9 @@ # Supported sites
- **VGTV**: VGTV, BTTV, FTV, Aftenposten and Aftonbladet
- **vh1.com**
- **vhx:embed**: [*vimeo*](## "netrc machine")
- - **vice**
- - **vice:article**
- - **vice:show**
+ - **vice**: (**Currently broken**)
+ - **vice:article**: (**Currently broken**)
+ - **vice:show**: (**Currently broken**)
- **Viddler**
- **Videa**
- **video.arnes.si**: Arnes Video
@@ -1656,6 +1657,7 @@ # Supported sites
- **vimeo**: [*vimeo*](## "netrc machine")
- **vimeo:album**: [*vimeo*](## "netrc machine")
- **vimeo:channel**: [*vimeo*](## "netrc machine")
+ - **vimeo:event**: [*vimeo*](## "netrc machine")
- **vimeo:group**: [*vimeo*](## "netrc machine")
- **vimeo:likes**: [*vimeo*](## "netrc machine") Vimeo user likes
- **vimeo:ondemand**: [*vimeo*](## "netrc machine")
diff --git a/test/test_InfoExtractor.py b/test/test_InfoExtractor.py
index c6ff6209a..e6c8d574e 100644
--- a/test/test_InfoExtractor.py
+++ b/test/test_InfoExtractor.py
@@ -314,6 +314,20 @@ def test_search_json_ld_realworld(self):
},
{},
),
+ (
+ # test thumbnail_url key without URL scheme
+ r'''
+''',
+ {
+ 'thumbnails': [{'url': 'https://www.nobelprize.org/images/12693-landscape-medium-gallery.jpg'}],
+ },
+ {},
+ ),
]
for html, expected_dict, search_json_ld_kwargs in _TESTS:
expect_dict(
@@ -1933,6 +1947,137 @@ def test_search_nextjs_data(self):
with self.assertWarns(DeprecationWarning):
self.assertEqual(self.ie._search_nextjs_data('', None, default='{}'), {})
+ def test_search_nuxt_json(self):
+ HTML_TMPL = '<script data-ssr="true" id="__NUXT_DATA__" type="application/json">[{}]</script>'
+ VALID_DATA = '''
+ ["ShallowReactive",1],
+ {"data":2,"state":21,"once":25,"_errors":28,"_server_errors":30},
+ ["ShallowReactive",3],
+ {"$abcdef123456":4},
+ {"podcast":5,"activeEpisodeData":7},
+ {"podcast":6,"seasons":14},
+ {"title":10,"id":11},
+ ["Reactive",8],
+ {"episode":9,"creators":18,"empty_list":20},
+ {"title":12,"id":13,"refs":34,"empty_refs":35},
+ "Series Title",
+ "podcast-id-01",
+ "Episode Title",
+ "episode-id-99",
+ [15,16,17],
+ 1,
+ 2,
+ 3,
+ [19],
+ "Podcast Creator",
+ [],
+ {"$ssite-config":22},
+ {"env":23,"name":24,"map":26,"numbers":14},
+ "production",
+ "podcast-website",
+ ["Set"],
+ ["Reactive",27],
+ ["Map"],
+ ["ShallowReactive",29],
+ {},
+ ["NuxtError",31],
+ {"status":32,"message":33},
+ 503,
+ "Service Unavailable",
+ [36,37],
+ [38,39],
+ ["Ref",40],
+ ["ShallowRef",41],
+ ["EmptyRef",42],
+ ["EmptyShallowRef",43],
+ "ref",
+ "shallow_ref",
+ "{\\"ref\\":1}",
+ "{\\"shallow_ref\\":2}"
+ '''
+ PAYLOAD = {
+ 'data': {
+ '$abcdef123456': {
+ 'podcast': {
+ 'podcast': {
+ 'title': 'Series Title',
+ 'id': 'podcast-id-01',
+ },
+ 'seasons': [1, 2, 3],
+ },
+ 'activeEpisodeData': {
+ 'episode': {
+ 'title': 'Episode Title',
+ 'id': 'episode-id-99',
+ 'refs': ['ref', 'shallow_ref'],
+ 'empty_refs': [{'ref': 1}, {'shallow_ref': 2}],
+ },
+ 'creators': ['Podcast Creator'],
+ 'empty_list': [],
+ },
+ },
+ },
+ 'state': {
+ '$ssite-config': {
+ 'env': 'production',
+ 'name': 'podcast-website',
+ 'map': [],
+ 'numbers': [1, 2, 3],
+ },
+ },
+ 'once': [],
+ '_errors': {},
+ '_server_errors': {
+ 'status': 503,
+ 'message': 'Service Unavailable',
+ },
+ }
+ PARTIALLY_INVALID = [(
+ '''
+ {"data":1},
+ {"invalid_raw_list":2},
+ [15,16,17]
+ ''',
+ {'data': {'invalid_raw_list': [None, None, None]}},
+ ), (
+ '''
+ {"data":1},
+ ["EmptyRef",2],
+ "not valid JSON"
+ ''',
+ {'data': None},
+ ), (
+ '''
+ {"data":1},
+ ["EmptyShallowRef",2],
+ "not valid JSON"
+ ''',
+ {'data': None},
+ )]
+ INVALID = [
+ '''
+ []
+ ''',
+ '''
+ ["unsupported",1],
+ {"data":2},
+ {}
+ ''',
+ ]
+ DEFAULT = object()
+
+ self.assertEqual(self.ie._search_nuxt_json(HTML_TMPL.format(VALID_DATA), None), PAYLOAD)
+ self.assertEqual(self.ie._search_nuxt_json('', None, fatal=False), {})
+ self.assertIs(self.ie._search_nuxt_json('', None, default=DEFAULT), DEFAULT)
+
+ for data, expected in PARTIALLY_INVALID:
+ self.assertEqual(
+ self.ie._search_nuxt_json(HTML_TMPL.format(data), None, fatal=False), expected)
+
+ for data in INVALID:
+ self.assertIs(
+ self.ie._search_nuxt_json(HTML_TMPL.format(data), None, default=DEFAULT), DEFAULT)
+
if __name__ == '__main__':
unittest.main()
diff --git a/test/test_YoutubeDL.py b/test/test_YoutubeDL.py
index 708a04f92..91312e4e5 100644
--- a/test/test_YoutubeDL.py
+++ b/test/test_YoutubeDL.py
@@ -1435,6 +1435,27 @@ def test_load_plugins_compat(self):
FakeYDL().close()
assert all_plugins_loaded.value
+ def test_close_hooks(self):
+ # Should call all registered close hooks on close
+ close_hook_called = False
+ close_hook_two_called = False
+
+ def close_hook():
+ nonlocal close_hook_called
+ close_hook_called = True
+
+ def close_hook_two():
+ nonlocal close_hook_two_called
+ close_hook_two_called = True
+
+ ydl = FakeYDL()
+ ydl.add_close_hook(close_hook)
+ ydl.add_close_hook(close_hook_two)
+
+ ydl.close()
+ self.assertTrue(close_hook_called, 'Close hook was not called')
+ self.assertTrue(close_hook_two_called, 'Close hook two was not called')
+
if __name__ == '__main__':
unittest.main()
diff --git a/test/test_cookies.py b/test/test_cookies.py
index 4b9b9b5a9..f956ab187 100644
--- a/test/test_cookies.py
+++ b/test/test_cookies.py
@@ -58,6 +58,14 @@ def test_get_desktop_environment(self):
({'DESKTOP_SESSION': 'kde'}, _LinuxDesktopEnvironment.KDE3),
({'DESKTOP_SESSION': 'xfce'}, _LinuxDesktopEnvironment.XFCE),
+ ({'XDG_CURRENT_DESKTOP': 'my_custom_de', 'DESKTOP_SESSION': 'gnome'}, _LinuxDesktopEnvironment.GNOME),
+ ({'XDG_CURRENT_DESKTOP': 'my_custom_de', 'DESKTOP_SESSION': 'mate'}, _LinuxDesktopEnvironment.GNOME),
+ ({'XDG_CURRENT_DESKTOP': 'my_custom_de', 'DESKTOP_SESSION': 'kde4'}, _LinuxDesktopEnvironment.KDE4),
+ ({'XDG_CURRENT_DESKTOP': 'my_custom_de', 'DESKTOP_SESSION': 'kde'}, _LinuxDesktopEnvironment.KDE3),
+ ({'XDG_CURRENT_DESKTOP': 'my_custom_de', 'DESKTOP_SESSION': 'xfce'}, _LinuxDesktopEnvironment.XFCE),
+
+ ({'XDG_CURRENT_DESKTOP': 'my_custom_de', 'DESKTOP_SESSION': 'my_custom_de', 'GNOME_DESKTOP_SESSION_ID': 1}, _LinuxDesktopEnvironment.GNOME),
+
({'GNOME_DESKTOP_SESSION_ID': 1}, _LinuxDesktopEnvironment.GNOME),
({'KDE_FULL_SESSION': 1}, _LinuxDesktopEnvironment.KDE3),
({'KDE_FULL_SESSION': 1, 'DESKTOP_SESSION': 'kde4'}, _LinuxDesktopEnvironment.KDE4),
diff --git a/test/test_devalue.py b/test/test_devalue.py
new file mode 100644
index 000000000..29eb89e87
--- /dev/null
+++ b/test/test_devalue.py
@@ -0,0 +1,235 @@
+#!/usr/bin/env python3
+
+# Allow direct execution
+import os
+import sys
+
+sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
+
+
+import datetime as dt
+import json
+import math
+import re
+import unittest
+
+from yt_dlp.utils.jslib import devalue
+
+
+TEST_CASES_EQUALS = [{
+ 'name': 'int',
+ 'unparsed': [-42],
+ 'parsed': -42,
+}, {
+ 'name': 'str',
+ 'unparsed': ['woo!!!'],
+ 'parsed': 'woo!!!',
+}, {
+ 'name': 'Number',
+ 'unparsed': [['Object', 42]],
+ 'parsed': 42,
+}, {
+ 'name': 'String',
+ 'unparsed': [['Object', 'yar']],
+ 'parsed': 'yar',
+}, {
+ 'name': 'Infinity',
+ 'unparsed': -4,
+ 'parsed': math.inf,
+}, {
+ 'name': 'negative Infinity',
+ 'unparsed': -5,
+ 'parsed': -math.inf,
+}, {
+ 'name': 'negative zero',
+ 'unparsed': -6,
+ 'parsed': -0.0,
+}, {
+ 'name': 'RegExp',
+ 'unparsed': [['RegExp', 'regexp', 'gim']], # XXX: flags are ignored
+ 'parsed': re.compile('regexp'),
+}, {
+ 'name': 'Date',
+ 'unparsed': [['Date', '2001-09-09T01:46:40.000Z']],
+ 'parsed': dt.datetime.fromtimestamp(1e9, tz=dt.timezone.utc),
+}, {
+ 'name': 'Array',
+ 'unparsed': [[1, 2, 3], 'a', 'b', 'c'],
+ 'parsed': ['a', 'b', 'c'],
+}, {
+ 'name': 'Array (empty)',
+ 'unparsed': [[]],
+ 'parsed': [],
+}, {
+ 'name': 'Array (sparse)',
+ 'unparsed': [[-2, 1, -2], 'b'],
+ 'parsed': [None, 'b', None],
+}, {
+ 'name': 'Object',
+ 'unparsed': [{'foo': 1, 'x-y': 2}, 'bar', 'z'],
+ 'parsed': {'foo': 'bar', 'x-y': 'z'},
+}, {
+ 'name': 'Set',
+ 'unparsed': [['Set', 1, 2, 3], 1, 2, 3],
+ 'parsed': [1, 2, 3],
+}, {
+ 'name': 'Map',
+ 'unparsed': [['Map', 1, 2], 'a', 'b'],
+ 'parsed': [['a', 'b']],
+}, {
+ 'name': 'BigInt',
+ 'unparsed': [['BigInt', '1']],
+ 'parsed': 1,
+}, {
+ 'name': 'Uint8Array',
+ 'unparsed': [['Uint8Array', 'AQID']],
+ 'parsed': [1, 2, 3],
+}, {
+ 'name': 'ArrayBuffer',
+ 'unparsed': [['ArrayBuffer', 'AQID']],
+ 'parsed': [1, 2, 3],
+}, {
+ 'name': 'str (repetition)',
+ 'unparsed': [[1, 1], 'a string'],
+ 'parsed': ['a string', 'a string'],
+}, {
+ 'name': 'None (repetition)',
+ 'unparsed': [[1, 1], None],
+ 'parsed': [None, None],
+}, {
+ 'name': 'dict (repetition)',
+ 'unparsed': [[1, 1], {}],
+ 'parsed': [{}, {}],
+}, {
+ 'name': 'Object without prototype',
+ 'unparsed': [['null']],
+ 'parsed': {},
+}, {
+ 'name': 'cross-realm POJO',
+ 'unparsed': [{}],
+ 'parsed': {},
+}]
+
+TEST_CASES_IS = [{
+ 'name': 'bool',
+ 'unparsed': [True],
+ 'parsed': True,
+}, {
+ 'name': 'Boolean',
+ 'unparsed': [['Object', False]],
+ 'parsed': False,
+}, {
+ 'name': 'undefined',
+ 'unparsed': -1,
+ 'parsed': None,
+}, {
+ 'name': 'null',
+ 'unparsed': [None],
+ 'parsed': None,
+}, {
+ 'name': 'NaN',
+ 'unparsed': -3,
+ 'parsed': math.nan,
+}]
+
+TEST_CASES_INVALID = [{
+ 'name': 'empty string',
+ 'unparsed': '',
+ 'error': ValueError,
+ 'pattern': r'expected int or list as input',
+}, {
+ 'name': 'hole',
+ 'unparsed': -2,
+ 'error': ValueError,
+ 'pattern': r'invalid integer input',
+}, {
+ 'name': 'string',
+ 'unparsed': 'hello',
+ 'error': ValueError,
+ 'pattern': r'expected int or list as input',
+}, {
+ 'name': 'number',
+ 'unparsed': 42,
+ 'error': ValueError,
+ 'pattern': r'invalid integer input',
+}, {
+ 'name': 'boolean',
+ 'unparsed': True,
+ 'error': ValueError,
+ 'pattern': r'expected int or list as input',
+}, {
+ 'name': 'null',
+ 'unparsed': None,
+ 'error': ValueError,
+ 'pattern': r'expected int or list as input',
+}, {
+ 'name': 'object',
+ 'unparsed': {},
+ 'error': ValueError,
+ 'pattern': r'expected int or list as input',
+}, {
+ 'name': 'empty array',
+ 'unparsed': [],
+ 'error': ValueError,
+ 'pattern': r'expected a non-empty list as input',
+}, {
+ 'name': 'Python negative indexing',
+ 'unparsed': [[1, 2, 3, 4, 5, 6, 7, -7], 1, 2, 3, 4, 5, 6, 7],
+ 'error': IndexError,
+ 'pattern': r'invalid index: -7',
+}]
+
+
+class TestDevalue(unittest.TestCase):
+ def test_devalue_parse_equals(self):
+ for tc in TEST_CASES_EQUALS:
+ self.assertEqual(devalue.parse(tc['unparsed']), tc['parsed'], tc['name'])
+
+ def test_devalue_parse_is(self):
+ for tc in TEST_CASES_IS:
+ self.assertIs(devalue.parse(tc['unparsed']), tc['parsed'], tc['name'])
+
+ def test_devalue_parse_invalid(self):
+ for tc in TEST_CASES_INVALID:
+ with self.assertRaisesRegex(tc['error'], tc['pattern'], msg=tc['name']):
+ devalue.parse(tc['unparsed'])
+
+ def test_devalue_parse_cyclical(self):
+ name = 'Map (cyclical)'
+ result = devalue.parse([['Map', 1, 0], 'self'])
+ self.assertEqual(result[0][0], 'self', name)
+ self.assertIs(result, result[0][1], name)
+
+ name = 'Set (cyclical)'
+ result = devalue.parse([['Set', 0, 1], 42])
+ self.assertEqual(result[1], 42, name)
+ self.assertIs(result, result[0], name)
+
+ result = devalue.parse([[0]])
+ self.assertIs(result, result[0], 'Array (cyclical)')
+
+ name = 'Object (cyclical)'
+ result = devalue.parse([{'self': 0}])
+ self.assertIs(result, result['self'], name)
+
+ name = 'Object with null prototype (cyclical)'
+ result = devalue.parse([['null', 'self', 0]])
+ self.assertIs(result, result['self'], name)
+
+ name = 'Objects (cyclical)'
+ result = devalue.parse([[1, 2], {'second': 2}, {'first': 1}])
+ self.assertIs(result[0], result[1]['first'], name)
+ self.assertIs(result[1], result[0]['second'], name)
+
+ def test_devalue_parse_revivers(self):
+ self.assertEqual(
+ devalue.parse([['indirect', 1], {'a': 2}, 'b'], revivers={'indirect': lambda x: x}),
+ {'a': 'b'}, 'revivers (indirect)')
+
+ self.assertEqual(
+ devalue.parse([['parse', 1], '{"a":0}'], revivers={'parse': lambda x: json.loads(x)}),
+ {'a': 0}, 'revivers (parse)')
+
+
+if __name__ == '__main__':
+ unittest.main()
diff --git a/test/test_jsinterp.py b/test/test_jsinterp.py
index b14069ccc..2e3cdc2a5 100644
--- a/test/test_jsinterp.py
+++ b/test/test_jsinterp.py
@@ -478,6 +478,14 @@ def test_extract_function_with_global_stack(self):
func = jsi.extract_function('c', {'e': 10}, {'f': 100, 'g': 1000})
self.assertEqual(func([1]), 1111)
+ def test_increment_decrement(self):
+ self._test('function f() { var x = 1; return ++x; }', 2)
+ self._test('function f() { var x = 1; return x++; }', 1)
+ self._test('function f() { var x = 1; x--; return x }', 0)
+ self._test('function f() { var y; var x = 1; x++, --x, x--, x--, y="z", "abc", x++; return --x }', -1)
+ self._test('function f() { var a = "test--"; return a; }', 'test--')
+ self._test('function f() { var b = 1; var a = "b--"; return a; }', 'b--')
+
if __name__ == '__main__':
unittest.main()
diff --git a/test/test_networking_utils.py b/test/test_networking_utils.py
index 204fe87bd..a2feacba7 100644
--- a/test/test_networking_utils.py
+++ b/test/test_networking_utils.py
@@ -20,7 +20,6 @@
add_accept_encoding_header,
get_redirect_method,
make_socks_proxy_opts,
- select_proxy,
ssl_load_certs,
)
from yt_dlp.networking.exceptions import (
@@ -28,7 +27,7 @@
IncompleteRead,
)
from yt_dlp.socks import ProxyType
-from yt_dlp.utils.networking import HTTPHeaderDict
+from yt_dlp.utils.networking import HTTPHeaderDict, select_proxy
TEST_DIR = os.path.dirname(os.path.abspath(__file__))
diff --git a/test/test_postprocessors.py b/test/test_postprocessors.py
index 603f85c65..ecc73e39e 100644
--- a/test/test_postprocessors.py
+++ b/test/test_postprocessors.py
@@ -8,6 +8,8 @@
sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
+import subprocess
+
from yt_dlp import YoutubeDL
from yt_dlp.utils import shell_quote
from yt_dlp.postprocessor import (
@@ -47,7 +49,18 @@ def test_escaping(self):
print('Skipping: ffmpeg not found')
return
- file = 'test/testdata/thumbnails/foo %d bar/foo_%d.{}'
+ test_data_dir = 'test/testdata/thumbnails'
+ generated_file = f'{test_data_dir}/empty.webp'
+
+ subprocess.check_call([
+ pp.executable, '-y', '-f', 'lavfi', '-i', 'color=c=black:s=320x320',
+ '-c:v', 'libwebp', '-pix_fmt', 'yuv420p', '-vframes', '1', generated_file,
+ ], stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL)
+
+ file = test_data_dir + '/foo %d bar/foo_%d.{}'
+ initial_file = file.format('webp')
+ os.replace(generated_file, initial_file)
+
tests = (('webp', 'png'), ('png', 'jpg'))
for inp, out in tests:
@@ -55,11 +68,13 @@ def test_escaping(self):
if os.path.exists(out_file):
os.remove(out_file)
pp.convert_thumbnail(file.format(inp), out)
- assert os.path.exists(out_file)
+ self.assertTrue(os.path.exists(out_file))
for _, out in tests:
os.remove(file.format(out))
+ os.remove(initial_file)
+
class TestExec(unittest.TestCase):
def test_parse_cmd(self):
@@ -610,3 +625,7 @@ def test_quote_for_concat_QuotesAtEnd(self):
self.assertEqual(
r"'special '\'' characters '\'' galore'\'\'\'",
self._pp._quote_for_ffmpeg("special ' characters ' galore'''"))
+
+
+if __name__ == '__main__':
+ unittest.main()
diff --git a/test/test_pot/conftest.py b/test/test_pot/conftest.py
new file mode 100644
index 000000000..ff0667e92
--- /dev/null
+++ b/test/test_pot/conftest.py
@@ -0,0 +1,71 @@
+import collections
+
+import pytest
+
+from yt_dlp import YoutubeDL
+from yt_dlp.cookies import YoutubeDLCookieJar
+from yt_dlp.extractor.common import InfoExtractor
+from yt_dlp.extractor.youtube.pot._provider import IEContentProviderLogger
+from yt_dlp.extractor.youtube.pot.provider import PoTokenRequest, PoTokenContext
+from yt_dlp.utils.networking import HTTPHeaderDict
+
+
+class MockLogger(IEContentProviderLogger):
+
+ log_level = IEContentProviderLogger.LogLevel.TRACE
+
+ def __init__(self, *args, **kwargs):
+ super().__init__(*args, **kwargs)
+ self.messages = collections.defaultdict(list)
+
+ def trace(self, message: str):
+ self.messages['trace'].append(message)
+
+ def debug(self, message: str):
+ self.messages['debug'].append(message)
+
+ def info(self, message: str):
+ self.messages['info'].append(message)
+
+ def warning(self, message: str, *, once=False):
+ self.messages['warning'].append(message)
+
+ def error(self, message: str):
+ self.messages['error'].append(message)
+
+
+@pytest.fixture
+def ie() -> InfoExtractor:
+ ydl = YoutubeDL()
+ return ydl.get_info_extractor('Youtube')
+
+
+@pytest.fixture
+def logger() -> MockLogger:
+ return MockLogger()
+
+
+@pytest.fixture()
+def pot_request() -> PoTokenRequest:
+ return PoTokenRequest(
+ context=PoTokenContext.GVS,
+ innertube_context={'client': {'clientName': 'WEB'}},
+ innertube_host='youtube.com',
+ session_index=None,
+ player_url=None,
+ is_authenticated=False,
+ video_webpage=None,
+
+ visitor_data='example-visitor-data',
+ data_sync_id='example-data-sync-id',
+ video_id='example-video-id',
+
+ request_cookiejar=YoutubeDLCookieJar(),
+ request_proxy=None,
+ request_headers=HTTPHeaderDict(),
+ request_timeout=None,
+ request_source_address=None,
+ request_verify_tls=True,
+
+ bypass_cache=False,
+ )
diff --git a/test/test_pot/test_pot_builtin_memorycache.py b/test/test_pot/test_pot_builtin_memorycache.py
new file mode 100644
index 000000000..ea19fbe29
--- /dev/null
+++ b/test/test_pot/test_pot_builtin_memorycache.py
@@ -0,0 +1,117 @@
+import threading
+import time
+from collections import OrderedDict
+import pytest
+from yt_dlp.extractor.youtube.pot._provider import IEContentProvider, BuiltinIEContentProvider
+from yt_dlp.utils import bug_reports_message
+from yt_dlp.extractor.youtube.pot._builtin.memory_cache import MemoryLRUPCP, memorylru_preference, initialize_global_cache
+from yt_dlp.version import __version__
+from yt_dlp.extractor.youtube.pot._registry import _pot_cache_providers, _pot_memory_cache
+
+
+class TestMemoryLRUPCS:
+
+ def test_base_type(self):
+ assert issubclass(MemoryLRUPCP, IEContentProvider)
+ assert issubclass(MemoryLRUPCP, BuiltinIEContentProvider)
+
+ @pytest.fixture
+ def pcp(self, ie, logger) -> MemoryLRUPCP:
+ return MemoryLRUPCP(ie, logger, {}, initialize_cache=lambda max_size: (OrderedDict(), threading.Lock(), max_size))
+
+ def test_is_registered(self):
+ assert _pot_cache_providers.value.get('MemoryLRU') == MemoryLRUPCP
+
+ def test_initialization(self, pcp):
+ assert pcp.PROVIDER_NAME == 'memory'
+ assert pcp.PROVIDER_VERSION == __version__
+ assert pcp.BUG_REPORT_MESSAGE == bug_reports_message(before='')
+ assert pcp.is_available()
+
+ def test_store_and_get(self, pcp):
+ pcp.store('key1', 'value1', int(time.time()) + 60)
+ assert pcp.get('key1') == 'value1'
+ assert len(pcp.cache) == 1
+
+ def test_store_ignore_expired(self, pcp):
+ pcp.store('key1', 'value1', int(time.time()) - 1)
+ assert len(pcp.cache) == 0
+ assert pcp.get('key1') is None
+ assert len(pcp.cache) == 0
+
+ def test_store_override_existing_key(self, ie, logger):
+ MAX_SIZE = 2
+ pcp = MemoryLRUPCP(ie, logger, {}, initialize_cache=lambda max_size: (OrderedDict(), threading.Lock(), MAX_SIZE))
+ pcp.store('key1', 'value1', int(time.time()) + 60)
+ pcp.store('key2', 'value2', int(time.time()) + 60)
+ assert len(pcp.cache) == 2
+ pcp.store('key1', 'value2', int(time.time()) + 60)
+ # Ensure that the override key gets added to the end of the cache instead of in the same position
+ pcp.store('key3', 'value3', int(time.time()) + 60)
+ assert pcp.get('key1') == 'value2'
+
+ def test_store_ignore_expired_existing_key(self, pcp):
+ pcp.store('key1', 'value2', int(time.time()) + 60)
+ pcp.store('key1', 'value1', int(time.time()) - 1)
+ assert len(pcp.cache) == 1
+ assert pcp.get('key1') == 'value2'
+ assert len(pcp.cache) == 1
+
+ def test_get_key_expired(self, pcp):
+ pcp.store('key1', 'value1', int(time.time()) + 60)
+ assert pcp.get('key1') == 'value1'
+ assert len(pcp.cache) == 1
+ pcp.cache['key1'] = ('value1', int(time.time()) - 1)
+ assert pcp.get('key1') is None
+ assert len(pcp.cache) == 0
+
+ def test_lru_eviction(self, ie, logger):
+ MAX_SIZE = 2
+ provider = MemoryLRUPCP(ie, logger, {}, initialize_cache=lambda max_size: (OrderedDict(), threading.Lock(), MAX_SIZE))
+ provider.store('key1', 'value1', int(time.time()) + 5)
+ provider.store('key2', 'value2', int(time.time()) + 5)
+ assert len(provider.cache) == 2
+
+ assert provider.get('key1') == 'value1'
+
+ provider.store('key3', 'value3', int(time.time()) + 5)
+ assert len(provider.cache) == 2
+
+ assert provider.get('key2') is None
+
+ provider.store('key4', 'value4', int(time.time()) + 5)
+ assert len(provider.cache) == 2
+
+ assert provider.get('key1') is None
+ assert provider.get('key3') == 'value3'
+ assert provider.get('key4') == 'value4'
+
+ def test_delete(self, pcp):
+ pcp.store('key1', 'value1', int(time.time()) + 5)
+ assert len(pcp.cache) == 1
+ assert pcp.get('key1') == 'value1'
+ pcp.delete('key1')
+ assert len(pcp.cache) == 0
+ assert pcp.get('key1') is None
+
+ def test_use_global_cache_default(self, ie, logger):
+ pcp = MemoryLRUPCP(ie, logger, {})
+ assert pcp.max_size == _pot_memory_cache.value['max_size'] == 25
+ assert pcp.cache is _pot_memory_cache.value['cache']
+ assert pcp.lock is _pot_memory_cache.value['lock']
+
+ pcp2 = MemoryLRUPCP(ie, logger, {})
+ assert pcp.max_size == pcp2.max_size == _pot_memory_cache.value['max_size'] == 25
+ assert pcp.cache is pcp2.cache is _pot_memory_cache.value['cache']
+ assert pcp.lock is pcp2.lock is _pot_memory_cache.value['lock']
+
+ def test_fail_max_size_change_global(self, ie, logger):
+ pcp = MemoryLRUPCP(ie, logger, {})
+ assert pcp.max_size == _pot_memory_cache.value['max_size'] == 25
+ with pytest.raises(ValueError, match='Cannot change max_size of initialized global memory cache'):
+ initialize_global_cache(50)
+
+ assert pcp.max_size == _pot_memory_cache.value['max_size'] == 25
+
+ def test_memory_lru_preference(self, pcp, ie, pot_request):
+ assert memorylru_preference(pcp, pot_request) == 10000
diff --git a/test/test_pot/test_pot_builtin_utils.py b/test/test_pot/test_pot_builtin_utils.py
new file mode 100644
index 000000000..7645ba601
--- /dev/null
+++ b/test/test_pot/test_pot_builtin_utils.py
@@ -0,0 +1,47 @@
+import pytest
+from yt_dlp.extractor.youtube.pot.provider import (
+ PoTokenContext,
+
+)
+
+from yt_dlp.extractor.youtube.pot.utils import get_webpo_content_binding, ContentBindingType
+
+
+class TestGetWebPoContentBinding:
+
+ @pytest.mark.parametrize('client_name, context, is_authenticated, expected', [
+ *[(client, context, is_authenticated, expected) for client in [
+ 'WEB', 'MWEB', 'TVHTML5', 'WEB_EMBEDDED_PLAYER', 'WEB_CREATOR', 'TVHTML5_SIMPLY_EMBEDDED_PLAYER', 'TVHTML5_SIMPLY']
+ for context, is_authenticated, expected in [
+ (PoTokenContext.GVS, False, ('example-visitor-data', ContentBindingType.VISITOR_DATA)),
+ (PoTokenContext.PLAYER, False, ('example-video-id', ContentBindingType.VIDEO_ID)),
+ (PoTokenContext.SUBS, False, ('example-video-id', ContentBindingType.VIDEO_ID)),
+ (PoTokenContext.GVS, True, ('example-data-sync-id', ContentBindingType.DATASYNC_ID)),
+ ]],
+ ('WEB_REMIX', PoTokenContext.GVS, False, ('example-visitor-data', ContentBindingType.VISITOR_DATA)),
+ ('WEB_REMIX', PoTokenContext.PLAYER, False, ('example-visitor-data', ContentBindingType.VISITOR_DATA)),
+ ('ANDROID', PoTokenContext.GVS, False, (None, None)),
+ ('IOS', PoTokenContext.GVS, False, (None, None)),
+ ])
+ def test_get_webpo_content_binding(self, pot_request, client_name, context, is_authenticated, expected):
+ pot_request.innertube_context['client']['clientName'] = client_name
+ pot_request.context = context
+ pot_request.is_authenticated = is_authenticated
+ assert get_webpo_content_binding(pot_request) == expected
+
+ def test_extract_visitor_id(self, pot_request):
+ pot_request.visitor_data = 'CgsxMjNhYmNYWVpfLSiA4s%2DqBg%3D%3D'
+ assert get_webpo_content_binding(pot_request, bind_to_visitor_id=True) == ('123abcXYZ_-', ContentBindingType.VISITOR_ID)
+
+ def test_invalid_visitor_id(self, pot_request):
+ # visitor id not alphanumeric (i.e. protobuf extraction failed)
+ pot_request.visitor_data = 'CggxMjM0NTY3OCiA4s-qBg%3D%3D'
+ assert get_webpo_content_binding(pot_request, bind_to_visitor_id=True) == (pot_request.visitor_data, ContentBindingType.VISITOR_DATA)
+
+ def test_no_visitor_id(self, pot_request):
+ pot_request.visitor_data = 'KIDiz6oG'
+ assert get_webpo_content_binding(pot_request, bind_to_visitor_id=True) == (pot_request.visitor_data, ContentBindingType.VISITOR_DATA)
+
+ def test_invalid_base64(self, pot_request):
+ pot_request.visitor_data = 'invalid-base64'
+ assert get_webpo_content_binding(pot_request, bind_to_visitor_id=True) == (pot_request.visitor_data, ContentBindingType.VISITOR_DATA)
diff --git a/test/test_pot/test_pot_builtin_webpospec.py b/test/test_pot/test_pot_builtin_webpospec.py
new file mode 100644
index 000000000..078008415
--- /dev/null
+++ b/test/test_pot/test_pot_builtin_webpospec.py
@@ -0,0 +1,92 @@
+import pytest
+
+from yt_dlp.extractor.youtube.pot._provider import IEContentProvider, BuiltinIEContentProvider
+from yt_dlp.extractor.youtube.pot.cache import CacheProviderWritePolicy
+from yt_dlp.utils import bug_reports_message
+from yt_dlp.extractor.youtube.pot.provider import (
+ PoTokenRequest,
+ PoTokenContext,
+
+)
+from yt_dlp.version import __version__
+
+from yt_dlp.extractor.youtube.pot._builtin.webpo_cachespec import WebPoPCSP
+from yt_dlp.extractor.youtube.pot._registry import _pot_pcs_providers
+
+
+# Module-level override of the `pot_request` fixture: takes the fixture of the same name
+# (defined outside this file - presumably a conftest) and pins its visitor_data.
+@pytest.fixture()
+def pot_request(pot_request) -> PoTokenRequest:
+ pot_request.visitor_data = 'CgsxMjNhYmNYWVpfLSiA4s%2DqBg%3D%3D' # visitor_id=123abcXYZ_-
+ return pot_request
+
+
+class TestWebPoPCSP:
+ """Tests for the built-in WebPoPCSP cache spec provider."""
+ def test_base_type(self):
+ """WebPoPCSP must derive from both IEContentProvider and BuiltinIEContentProvider."""
+ assert issubclass(WebPoPCSP, IEContentProvider)
+ assert issubclass(WebPoPCSP, BuiltinIEContentProvider)
+
+ def test_init(self, ie, logger):
+ """Checks the provider's name, version, bug report message and availability after construction."""
+ pcs = WebPoPCSP(ie=ie, logger=logger, settings={})
+ assert pcs.PROVIDER_NAME == 'webpo'
+ assert pcs.PROVIDER_VERSION == __version__
+ assert pcs.BUG_REPORT_MESSAGE == bug_reports_message(before='')
+ assert pcs.is_available()
+
+ def test_is_registered(self):
+ """The provider must be present in the PCS provider registry under the key 'WebPo'."""
+ assert _pot_pcs_providers.value.get('WebPo') == WebPoPCSP
+
+ # Client/context combinations for which no cache spec is expected
+ @pytest.mark.parametrize('client_name, context, is_authenticated', [
+ ('ANDROID', PoTokenContext.GVS, False),
+ ('IOS', PoTokenContext.GVS, False),
+ ('IOS', PoTokenContext.PLAYER, False),
+ ])
+ def test_not_supports(self, ie, logger, pot_request, client_name, context, is_authenticated):
+ """generate_cache_spec() returns None for each parametrized client/context combination."""
+ pcs = WebPoPCSP(ie=ie, logger=logger, settings={})
+ pot_request.innertube_context['client']['clientName'] = client_name
+ pot_request.context = context
+ pot_request.is_authenticated = is_authenticated
+ assert pcs.generate_cache_spec(pot_request) is None
+
+ # The first entry expands to every listed client crossed with three (context, auth) cases;
+ # the remaining entries are individual cases (WEB_REMIX, and None-valued network fields).
+ @pytest.mark.parametrize('client_name, context, is_authenticated, remote_host, source_address, request_proxy, expected', [
+ *[(client, context, is_authenticated, remote_host, source_address, request_proxy, expected) for client in [
+ 'WEB', 'MWEB', 'TVHTML5', 'WEB_EMBEDDED_PLAYER', 'WEB_CREATOR', 'TVHTML5_SIMPLY_EMBEDDED_PLAYER', 'TVHTML5_SIMPLY']
+ for context, is_authenticated, remote_host, source_address, request_proxy, expected in [
+ (PoTokenContext.GVS, False, 'example-remote-host', 'example-source-address', 'example-request-proxy', {'t': 'webpo', 'ip': 'example-remote-host', 'sa': 'example-source-address', 'px': 'example-request-proxy', 'cb': '123abcXYZ_-', 'cbt': 'visitor_id'}),
+ (PoTokenContext.PLAYER, False, 'example-remote-host', 'example-source-address', 'example-request-proxy', {'t': 'webpo', 'ip': 'example-remote-host', 'sa': 'example-source-address', 'px': 'example-request-proxy', 'cb': '123abcXYZ_-', 'cbt': 'video_id'}),
+ (PoTokenContext.GVS, True, 'example-remote-host', 'example-source-address', 'example-request-proxy', {'t': 'webpo', 'ip': 'example-remote-host', 'sa': 'example-source-address', 'px': 'example-request-proxy', 'cb': 'example-data-sync-id', 'cbt': 'datasync_id'}),
+ ]],
+ ('WEB_REMIX', PoTokenContext.PLAYER, False, 'example-remote-host', 'example-source-address', 'example-request-proxy', {'t': 'webpo', 'ip': 'example-remote-host', 'sa': 'example-source-address', 'px': 'example-request-proxy', 'cb': '123abcXYZ_-', 'cbt': 'visitor_id'}),
+ ('WEB', PoTokenContext.GVS, False, None, None, None, {'t': 'webpo', 'cb': '123abcXYZ_-', 'cbt': 'visitor_id', 'ip': None, 'sa': None, 'px': None}),
+ ('TVHTML5', PoTokenContext.PLAYER, False, None, None, 'http://example.com', {'t': 'webpo', 'cb': '123abcXYZ_-', 'cbt': 'video_id', 'ip': None, 'sa': None, 'px': 'http://example.com'}),
+
+ ])
+ def test_generate_key_bindings(self, ie, logger, pot_request, client_name, context, is_authenticated, remote_host, source_address, request_proxy, expected):
+ """The generated spec's key_bindings must equal `expected` for the configured request."""
+ pcs = WebPoPCSP(ie=ie, logger=logger, settings={})
+ pot_request.innertube_context['client']['clientName'] = client_name
+ pot_request.context = context
+ pot_request.is_authenticated = is_authenticated
+ pot_request.innertube_context['client']['remoteHost'] = remote_host
+ pot_request.request_source_address = source_address
+ pot_request.request_proxy = request_proxy
+ pot_request.video_id = '123abcXYZ_-' # same as visitor id to test type
+
+ assert pcs.generate_cache_spec(pot_request).key_bindings == expected
+
+ def test_no_bind_visitor_id(self, ie, logger, pot_request):
+ """With bind_to_visitor_id set to ['false'], 'cb' is the raw visitor_data and 'cbt' is 'visitor_data'."""
+ # Should not bind to visitor id if setting is set to False
+ pcs = WebPoPCSP(ie=ie, logger=logger, settings={'bind_to_visitor_id': ['false']})
+ pot_request.innertube_context['client']['clientName'] = 'WEB'
+ pot_request.context = PoTokenContext.GVS
+ pot_request.is_authenticated = False
+ assert pcs.generate_cache_spec(pot_request).key_bindings == {'t': 'webpo', 'ip': None, 'sa': None, 'px': None, 'cb': 'CgsxMjNhYmNYWVpfLSiA4s%2DqBg%3D%3D', 'cbt': 'visitor_data'}
+
+ def test_default_ttl(self, ie, logger, pot_request):
+ """The generated spec's default_ttl is 6 hours expressed in seconds."""
+ pcs = WebPoPCSP(ie=ie, logger=logger, settings={})
+ assert pcs.generate_cache_spec(pot_request).default_ttl == 6 * 60 * 60 # should default to 6 hours
+
+ def test_write_policy(self, ie, logger, pot_request):
+ """GVS requests get WRITE_ALL; PLAYER requests get WRITE_FIRST."""
+ pcs = WebPoPCSP(ie=ie, logger=logger, settings={})
+ pot_request.context = PoTokenContext.GVS
+ assert pcs.generate_cache_spec(pot_request).write_policy == CacheProviderWritePolicy.WRITE_ALL
+ pot_request.context = PoTokenContext.PLAYER
+ assert pcs.generate_cache_spec(pot_request).write_policy == CacheProviderWritePolicy.WRITE_FIRST
diff --git a/test/test_pot/test_pot_director.py b/test/test_pot/test_pot_director.py
new file mode 100644
index 000000000..bbfdd0e98
--- /dev/null
+++ b/test/test_pot/test_pot_director.py
@@ -0,0 +1,1529 @@
+from __future__ import annotations
+import abc
+import base64
+import dataclasses
+import hashlib
+import json
+import time
+import pytest
+
+from yt_dlp.extractor.youtube.pot._provider import BuiltinIEContentProvider, IEContentProvider
+
+from yt_dlp.extractor.youtube.pot.provider import (
+ PoTokenRequest,
+ PoTokenContext,
+ PoTokenProviderError,
+ PoTokenProviderRejectedRequest,
+)
+from yt_dlp.extractor.youtube.pot._director import (
+ PoTokenCache,
+ validate_cache_spec,
+ clean_pot,
+ validate_response,
+ PoTokenRequestDirector,
+ provider_display_list,
+)
+
+from yt_dlp.extractor.youtube.pot.cache import (
+ PoTokenCacheSpec,
+ PoTokenCacheSpecProvider,
+ PoTokenCacheProvider,
+ CacheProviderWritePolicy,
+ PoTokenCacheProviderError,
+)
+
+
+from yt_dlp.extractor.youtube.pot.provider import (
+ PoTokenResponse,
+ PoTokenProvider,
+)
+
+
+class BaseMockPoTokenProvider(PoTokenProvider, abc.ABC):
+ """Base test double for PoTokenProvider: counts is_available()/request_pot() calls and records close()."""
+ def __init__(self, *args, **kwargs):
+ super().__init__(*args, **kwargs)
+ self.available_called_times = 0
+ self.request_called_times = 0
+ self.close_called = False
+
+ def is_available(self) -> bool:
+ # Always reports available; subclasses override to report otherwise
+ self.available_called_times += 1
+ return True
+
+ def request_pot(self, *args, **kwargs):
+ # Count the call, then defer to the parent request_pot()
+ self.request_called_times += 1
+ return super().request_pot(*args, **kwargs)
+
+ def close(self):
+ self.close_called = True
+ super().close()
+
+
+class ExamplePTP(BaseMockPoTokenProvider):
+ """Mock provider declaring support for the WEB client and the GVS context only."""
+ PROVIDER_NAME = 'example'
+ PROVIDER_VERSION = '0.0.1'
+ BUG_REPORT_LOCATION = 'https://example.com/issues'
+
+ _SUPPORTED_CLIENTS = ('WEB',)
+ _SUPPORTED_CONTEXTS = (PoTokenContext.GVS, )
+
+ def _real_request_pot(self, request: PoTokenRequest) -> PoTokenResponse:
+ # When data_sync_id is 'example', the request's video_id is returned as the token;
+ # otherwise the module-level EXAMPLE_PO_TOKEN is used (looked up at call time).
+ if request.data_sync_id == 'example':
+ return PoTokenResponse(request.video_id)
+ return PoTokenResponse(EXAMPLE_PO_TOKEN)
+
+
+def success_ptp(response: PoTokenResponse | None = None, key: str | None = None):
+ """Build and return a mock provider *class* (not an instance) whose requests succeed.
+
+ response: returned by the provider when truthy; otherwise PoTokenResponse(EXAMPLE_PO_TOKEN) is returned.
+ key: when truthy, assigned to the class as PROVIDER_KEY.
+ """
+ class SuccessPTP(BaseMockPoTokenProvider):
+ PROVIDER_NAME = 'success'
+ PROVIDER_VERSION = '0.0.1'
+ BUG_REPORT_LOCATION = 'https://success.example.com/issues'
+
+ _SUPPORTED_CLIENTS = ('WEB',)
+ _SUPPORTED_CONTEXTS = (PoTokenContext.GVS,)
+
+ def _real_request_pot(self, request: PoTokenRequest) -> PoTokenResponse:
+ return response or PoTokenResponse(EXAMPLE_PO_TOKEN)
+
+ if key:
+ SuccessPTP.PROVIDER_KEY = key
+ # NOTE(review): indentation is lost in this patch view; this return is presumably at function
+ # level, since the pot_provider fixture calls success_ptp() without a key and instantiates the result.
+ return SuccessPTP
+
+
+# Fixture: an instance of the default success_ptp() class, constructed with empty settings.
+@pytest.fixture
+def pot_provider(ie, logger):
+ return success_ptp()(ie=ie, logger=logger, settings={})
+
+
+class UnavailablePTP(BaseMockPoTokenProvider):
+ """Mock provider whose is_available() always returns False."""
+ PROVIDER_NAME = 'unavailable'
+ BUG_REPORT_LOCATION = 'https://unavailable.example.com/issues'
+ _SUPPORTED_CLIENTS = None
+ _SUPPORTED_CONTEXTS = None
+
+ def is_available(self) -> bool:
+ # Call the parent only to bump available_called_times; its True result is discarded
+ super().is_available()
+ return False
+
+ def _real_request_pot(self, request: PoTokenRequest) -> PoTokenResponse:
+ raise PoTokenProviderError('something went wrong')
+
+
+class UnsupportedPTP(BaseMockPoTokenProvider):
+ """Mock provider that rejects every request with PoTokenProviderRejectedRequest."""
+ PROVIDER_NAME = 'unsupported'
+ BUG_REPORT_LOCATION = 'https://unsupported.example.com/issues'
+ _SUPPORTED_CLIENTS = None
+ _SUPPORTED_CONTEXTS = None
+
+ def _real_request_pot(self, request: PoTokenRequest) -> PoTokenResponse:
+ raise PoTokenProviderRejectedRequest('unsupported request')
+
+
+class ErrorPTP(BaseMockPoTokenProvider):
+ """Mock provider that always raises PoTokenProviderError."""
+ PROVIDER_NAME = 'error'
+ BUG_REPORT_LOCATION = 'https://error.example.com/issues'
+ _SUPPORTED_CLIENTS = None
+ _SUPPORTED_CONTEXTS = None
+
+ def _real_request_pot(self, request: PoTokenRequest) -> PoTokenResponse:
+ # The error is flagged expected=True only when the request's video_id is the string 'expected'
+ expected = request.video_id == 'expected'
+ raise PoTokenProviderError('an error occurred', expected=expected)
+
+
+class UnexpectedErrorPTP(BaseMockPoTokenProvider):
+ """Mock provider that raises a plain ValueError rather than a PoTokenProviderError."""
+ PROVIDER_NAME = 'unexpected_error'
+ BUG_REPORT_LOCATION = 'https://unexpected.example.com/issues'
+ _SUPPORTED_CLIENTS = None
+ _SUPPORTED_CONTEXTS = None
+
+ def _real_request_pot(self, request: PoTokenRequest) -> PoTokenResponse:
+ raise ValueError('an unexpected error occurred')
+
+
+class InvalidPTP(BaseMockPoTokenProvider):
+ """Mock provider returning malformed results.
+
+ NOTE(review): both return values are presumably meant to fail response validation (per the class name) - confirm.
+ """
+ PROVIDER_NAME = 'invalid'
+ BUG_REPORT_LOCATION = 'https://invalid.example.com/issues'
+ _SUPPORTED_CLIENTS = None
+ _SUPPORTED_CONTEXTS = None
+
+ def _real_request_pot(self, request: PoTokenRequest) -> PoTokenResponse:
+ if request.video_id == 'invalid_type':
+ # A bare str instead of a PoTokenResponse
+ return 'invalid-response'
+ else:
+ # A PoTokenResponse whose expires_at is the string '123'
+ return PoTokenResponse('example-token?', expires_at='123')
+
+
+class BaseMockCacheSpecProvider(PoTokenCacheSpecProvider, abc.ABC):
+ """Base test double for cache spec providers: counts is_available()/generate_cache_spec() calls and records close()."""
+ def __init__(self, *args, **kwargs):
+ super().__init__(*args, **kwargs)
+ self.generate_called_times = 0
+ self.is_available_called_times = 0
+ self.close_called = False
+
+ def is_available(self) -> bool:
+ self.is_available_called_times += 1
+ return super().is_available()
+
+ def generate_cache_spec(self, request: PoTokenRequest):
+ # Only counts the call (implicitly returns None); subclasses call this via super() and return their own result
+ self.generate_called_times += 1
+
+ def close(self):
+ self.close_called = True
+ super().close()
+
+
+class ExampleCacheSpecProviderPCSP(BaseMockCacheSpecProvider):
+ """Mock spec provider returning a valid spec keyed on the request's video_id, with a 60 second default TTL."""
+
+ PROVIDER_NAME = 'example'
+ PROVIDER_VERSION = '0.0.1'
+ BUG_REPORT_LOCATION = 'https://example.com/issues'
+
+ def generate_cache_spec(self, request: PoTokenRequest):
+ super().generate_cache_spec(request)
+ # The bindings deliberately include a None-valued entry ('e')
+ return PoTokenCacheSpec(
+ key_bindings={'v': request.video_id, 'e': None},
+ default_ttl=60,
+ )
+
+
+class UnavailableCacheSpecProviderPCSP(BaseMockCacheSpecProvider):
+ """Mock spec provider whose is_available() always returns False."""
+
+ PROVIDER_NAME = 'unavailable'
+ PROVIDER_VERSION = '0.0.1'
+
+ def is_available(self) -> bool:
+ # Call the parent only to bump is_available_called_times; its result is discarded
+ super().is_available()
+ return False
+
+ def generate_cache_spec(self, request: PoTokenRequest):
+ super().generate_cache_spec(request)
+ return None
+
+
+class UnsupportedCacheSpecProviderPCSP(BaseMockCacheSpecProvider):
+ """Mock spec provider that counts the call and returns None (no spec) for every request."""
+
+ PROVIDER_NAME = 'unsupported'
+ PROVIDER_VERSION = '0.0.1'
+
+ def generate_cache_spec(self, request: PoTokenRequest):
+ super().generate_cache_spec(request)
+ return None
+
+
+class InvalidSpecCacheSpecProviderPCSP(BaseMockCacheSpecProvider):
+ """Mock spec provider that returns the str 'invalid-spec' instead of a PoTokenCacheSpec."""
+
+ PROVIDER_NAME = 'invalid'
+ PROVIDER_VERSION = '0.0.1'
+
+ def generate_cache_spec(self, request: PoTokenRequest):
+ super().generate_cache_spec(request)
+ return 'invalid-spec'
+
+
+class ErrorSpecCacheSpecProviderPCSP(BaseMockCacheSpecProvider):
+ """Mock spec provider whose generate_cache_spec() counts the call and then raises ValueError."""
+
+ # Same value as InvalidSpecCacheSpecProviderPCSP.PROVIDER_NAME; the error-message assertions
+ # in TestPoTokenCache match on the name "invalid", so changing it requires updating them too.
+ PROVIDER_NAME = 'invalid'
+ PROVIDER_VERSION = '0.0.1'
+
+ def generate_cache_spec(self, request: PoTokenRequest):
+ super().generate_cache_spec(request)
+ raise ValueError('something went wrong')
+
+
+class BaseMockCacheProvider(PoTokenCacheProvider, abc.ABC):
+    """Base test double for PoTokenCacheProvider.
+
+    Counts store()/delete()/get()/is_available() calls and records close().
+    The base store/delete/get only count; subclasses add behaviour on top.
+
+    available: keyword-only flag returned by is_available() (default True).
+    """
+    BUG_REPORT_MESSAGE = 'example bug report message'
+
+    def __init__(self, *args, available=True, **kwargs):
+        super().__init__(*args, **kwargs)
+        self.store_calls = 0
+        self.delete_calls = 0
+        self.get_calls = 0
+        self.available_called_times = 0
+        self.available = available
+        # Initialised up front, as the other base mocks in this file do, so that
+        # reading close_called before close() yields False instead of AttributeError
+        self.close_called = False
+
+    def is_available(self) -> bool:
+        self.available_called_times += 1
+        return self.available
+
+    def store(self, *args, **kwargs):
+        self.store_calls += 1
+
+    def delete(self, *args, **kwargs):
+        self.delete_calls += 1
+
+    def get(self, *args, **kwargs):
+        self.get_calls += 1
+
+    def close(self):
+        self.close_called = True
+        super().close()
+
+
+class ErrorPCP(BaseMockCacheProvider):
+ """Mock cache provider whose store() and get() count the call and then raise PoTokenCacheProviderError."""
+ PROVIDER_NAME = 'error'
+
+ def store(self, *args, **kwargs):
+ super().store(*args, **kwargs)
+ raise PoTokenCacheProviderError('something went wrong')
+
+ def get(self, *args, **kwargs):
+ super().get(*args, **kwargs)
+ raise PoTokenCacheProviderError('something went wrong')
+
+
+class UnexpectedErrorPCP(BaseMockCacheProvider):
+ """Mock cache provider whose store() and get() count the call and then raise a plain ValueError."""
+ PROVIDER_NAME = 'unexpected_error'
+
+ def store(self, *args, **kwargs):
+ super().store(*args, **kwargs)
+ raise ValueError('something went wrong')
+
+ def get(self, *args, **kwargs):
+ super().get(*args, **kwargs)
+ raise ValueError('something went wrong')
+
+
+class MockMemoryPCP(BaseMockCacheProvider):
+ """Dict-backed mock cache provider; entries are kept in self.cache as key -> (value, expires_at)."""
+ PROVIDER_NAME = 'memory'
+
+ def __init__(self, *args, **kwargs):
+ super().__init__(*args, **kwargs)
+ self.cache = {}
+
+ def store(self, key, value, expires_at):
+ super().store(key, value, expires_at)
+ self.cache[key] = (value, expires_at)
+
+ def delete(self, key):
+ super().delete(key)
+ # Deleting a missing key is a no-op
+ self.cache.pop(key, None)
+
+ def get(self, key):
+ super().get(key)
+ # Returns only the stored value (expires_at is not consulted); the [None] default makes a miss return None
+ return self.cache.get(key, [None])[0]
+
+
+def create_memory_pcp(ie, logger, provider_key='memory', provider_name='memory', available=True):
+ """Create a MockMemoryPCP with empty settings and set PROVIDER_KEY/PROVIDER_NAME on that instance."""
+ cache = MockMemoryPCP(ie, logger, {}, available=available)
+ # Assigned on the instance, so other MockMemoryPCP instances keep their own key/name
+ cache.PROVIDER_KEY = provider_key
+ cache.PROVIDER_NAME = provider_name
+ return cache
+
+
+# Fixture: a MockMemoryPCP built by create_memory_pcp() with its default key and name ('memory').
+@pytest.fixture
+def memorypcp(ie, logger) -> MockMemoryPCP:
+ return create_memory_pcp(ie, logger)
+
+
+# Fixture: a PoTokenCache subclass that counts get()/store() calls and records close(),
+# backed by one MockMemoryPCP and one ExampleCacheSpecProviderPCSP.
+@pytest.fixture
+def pot_cache(ie, logger):
+ class MockPoTokenCache(PoTokenCache):
+ def __init__(self, *args, **kwargs):
+ super().__init__(*args, **kwargs)
+ self.get_calls = 0
+ self.store_calls = 0
+ self.close_called = False
+
+ def get(self, *args, **kwargs):
+ # Count, then delegate to the real PoTokenCache.get()
+ self.get_calls += 1
+ return super().get(*args, **kwargs)
+
+ def store(self, *args, **kwargs):
+ # Count, then delegate to the real PoTokenCache.store()
+ self.store_calls += 1
+ return super().store(*args, **kwargs)
+
+ def close(self):
+ self.close_called = True
+ super().close()
+
+ return MockPoTokenCache(
+ cache_providers=[MockMemoryPCP(ie, logger, {})],
+ cache_spec_providers=[ExampleCacheSpecProviderPCSP(ie, logger, settings={})],
+ logger=logger,
+ )
+
+
+# URL-safe base64 encoding of b'example-token'; used as the PO Token value by the mocks and tests in this file.
+EXAMPLE_PO_TOKEN = base64.urlsafe_b64encode(b'example-token').decode()
+
+
+class TestPoTokenCache:
+
+ def test_cache_success(self, memorypcp, pot_request, ie, logger):
+ """Miss, then store, then hit for the same request; a request with a different video_id still misses."""
+ cache = PoTokenCache(
+ cache_providers=[memorypcp],
+ cache_spec_providers=[ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+
+ assert cache.get(pot_request) is None
+ cache.store(pot_request, response)
+
+ cached_response = cache.get(pot_request)
+ assert cached_response is not None
+ assert cached_response.po_token == EXAMPLE_PO_TOKEN
+ # The stored response had no explicit expiry, yet the cached one comes back with expires_at set
+ assert cached_response.expires_at is not None
+
+ assert cache.get(dataclasses.replace(pot_request, video_id='another-video-id')) is None
+
+ def test_unsupported_cache_spec_no_fallback(self, memorypcp, pot_request, ie, logger):
+ """When the only spec provider returns None, nothing is cached and no error is logged."""
+ unsupported_provider = UnsupportedCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})
+ cache = PoTokenCache(
+ cache_providers=[memorypcp],
+ cache_spec_providers=[unsupported_provider],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+ # The spec provider is consulted once per get()/store() call
+ assert cache.get(pot_request) is None
+ assert unsupported_provider.generate_called_times == 1
+ cache.store(pot_request, response)
+ assert len(memorypcp.cache) == 0
+ assert unsupported_provider.generate_called_times == 2
+ assert cache.get(pot_request) is None
+ assert unsupported_provider.generate_called_times == 3
+ assert len(logger.messages.get('error', [])) == 0
+
+ def test_unsupported_cache_spec_fallback(self, memorypcp, pot_request, ie, logger):
+ """When the first spec provider returns None, the next provider's spec is used and caching works without errors."""
+ unsupported_provider = UnsupportedCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})
+ example_provider = ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})
+ cache = PoTokenCache(
+ cache_providers=[memorypcp],
+ cache_spec_providers=[unsupported_provider, example_provider],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+
+ # Both providers are consulted once per get()/store() call
+ assert cache.get(pot_request) is None
+ assert unsupported_provider.generate_called_times == 1
+ assert example_provider.generate_called_times == 1
+
+ cache.store(pot_request, response)
+ assert unsupported_provider.generate_called_times == 2
+ assert example_provider.generate_called_times == 2
+
+ cached_response = cache.get(pot_request)
+ assert unsupported_provider.generate_called_times == 3
+ assert example_provider.generate_called_times == 3
+ assert cached_response is not None
+ assert cached_response.po_token == EXAMPLE_PO_TOKEN
+ assert cached_response.expires_at is not None
+
+ assert len(logger.messages.get('error', [])) == 0
+
+ def test_invalid_cache_spec_no_fallback(self, memorypcp, pot_request, ie, logger):
+ """A non-PoTokenCacheSpec return value from the only spec provider means nothing is cached and an error is logged."""
+ cache = PoTokenCache(
+ cache_providers=[memorypcp],
+ cache_spec_providers=[InvalidSpecCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+
+ assert cache.get(pot_request) is None
+ cache.store(pot_request, response)
+
+ assert cache.get(pot_request) is None
+
+ # The expected message names the provider as "InvalidSpecCacheSpecProvider" (class name without the PCSP suffix)
+ assert 'PoTokenCacheSpecProvider "InvalidSpecCacheSpecProvider" generate_cache_spec() returned invalid spec invalid-spec; please report this issue to the provider developer at (developer has not provided a bug report location) .' in logger.messages['error']
+
+ def test_invalid_cache_spec_fallback(self, memorypcp, pot_request, ie, logger):
+ """An invalid spec from the first provider is logged as an error and the next provider's spec is used."""
+
+ invalid_provider = InvalidSpecCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})
+ example_provider = ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})
+ cache = PoTokenCache(
+ cache_providers=[memorypcp],
+ cache_spec_providers=[invalid_provider, example_provider],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+
+ # Both providers are consulted once per get()/store() call
+ assert cache.get(pot_request) is None
+ assert invalid_provider.generate_called_times == example_provider.generate_called_times == 1
+
+ cache.store(pot_request, response)
+ assert invalid_provider.generate_called_times == example_provider.generate_called_times == 2
+
+ cached_response = cache.get(pot_request)
+ assert invalid_provider.generate_called_times == example_provider.generate_called_times == 3
+ assert cached_response is not None
+ assert cached_response.po_token == EXAMPLE_PO_TOKEN
+ assert cached_response.expires_at is not None
+
+ assert 'PoTokenCacheSpecProvider "InvalidSpecCacheSpecProvider" generate_cache_spec() returned invalid spec invalid-spec; please report this issue to the provider developer at (developer has not provided a bug report location) .' in logger.messages['error']
+
+ def test_unavailable_cache_spec_no_fallback(self, memorypcp, pot_request, ie, logger):
+ """An unavailable spec provider is never asked to generate a spec, so nothing is cached."""
+ unavailable_provider = UnavailableCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})
+ cache = PoTokenCache(
+ cache_providers=[memorypcp],
+ cache_spec_providers=[unavailable_provider],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+
+ assert cache.get(pot_request) is None
+ cache.store(pot_request, response)
+ assert cache.get(pot_request) is None
+ assert unavailable_provider.generate_called_times == 0
+
+ def test_unavailable_cache_spec_fallback(self, memorypcp, pot_request, ie, logger):
+ """An unavailable first spec provider is skipped and the next provider's spec is used."""
+ unavailable_provider = UnavailableCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})
+ example_provider = ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})
+ cache = PoTokenCache(
+ cache_providers=[memorypcp],
+ cache_spec_providers=[unavailable_provider, example_provider],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+
+ # Availability is re-checked on every get()/store(); generate is never called on the unavailable provider
+ assert cache.get(pot_request) is None
+ assert unavailable_provider.generate_called_times == 0
+ assert unavailable_provider.is_available_called_times == 1
+ assert example_provider.generate_called_times == 1
+
+ cache.store(pot_request, response)
+ assert unavailable_provider.generate_called_times == 0
+ assert unavailable_provider.is_available_called_times == 2
+ assert example_provider.generate_called_times == 2
+
+ cached_response = cache.get(pot_request)
+ assert unavailable_provider.generate_called_times == 0
+ assert unavailable_provider.is_available_called_times == 3
+ assert example_provider.generate_called_times == 3
+ assert example_provider.is_available_called_times == 3
+ assert cached_response is not None
+ assert cached_response.po_token == EXAMPLE_PO_TOKEN
+ assert cached_response.expires_at is not None
+
+ def test_unexpected_error_cache_spec(self, memorypcp, pot_request, ie, logger):
+ """A ValueError raised by the only spec provider is logged as an error; get()/store() do not raise and nothing is cached."""
+ error_provider = ErrorSpecCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})
+ cache = PoTokenCache(
+ cache_providers=[memorypcp],
+ cache_spec_providers=[error_provider],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+
+ assert cache.get(pot_request) is None
+ cache.store(pot_request, response)
+ assert cache.get(pot_request) is None
+ # One availability check and one generate attempt per get()/store() call
+ assert error_provider.generate_called_times == 3
+ assert error_provider.is_available_called_times == 3
+
+ # "invalid" in the message is ErrorSpecCacheSpecProviderPCSP.PROVIDER_NAME
+ assert 'Error occurred with "invalid" PO Token cache spec provider: ValueError(\'something went wrong\'); please report this issue to the provider developer at (developer has not provided a bug report location) .' in logger.messages['error']
+
+ def test_unexpected_error_cache_spec_fallback(self, memorypcp, pot_request, ie, logger):
+ """A ValueError from the first spec provider is logged and the next provider's spec is used."""
+ error_provider = ErrorSpecCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})
+ example_provider = ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})
+ cache = PoTokenCache(
+ cache_providers=[memorypcp],
+ cache_spec_providers=[error_provider, example_provider],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+
+ # The failing provider is still tried on every get()/store() call
+ assert cache.get(pot_request) is None
+ assert error_provider.generate_called_times == 1
+ assert error_provider.is_available_called_times == 1
+ assert example_provider.generate_called_times == 1
+
+ cache.store(pot_request, response)
+ assert error_provider.generate_called_times == 2
+ assert error_provider.is_available_called_times == 2
+ assert example_provider.generate_called_times == 2
+
+ cached_response = cache.get(pot_request)
+ assert error_provider.generate_called_times == 3
+ assert error_provider.is_available_called_times == 3
+ assert example_provider.generate_called_times == 3
+ assert example_provider.is_available_called_times == 3
+ assert cached_response is not None
+ assert cached_response.po_token == EXAMPLE_PO_TOKEN
+ assert cached_response.expires_at is not None
+
+ # "invalid" in the message is ErrorSpecCacheSpecProviderPCSP.PROVIDER_NAME
+ assert 'Error occurred with "invalid" PO Token cache spec provider: ValueError(\'something went wrong\'); please report this issue to the provider developer at (developer has not provided a bug report location) .' in logger.messages['error']
+
+ def test_key_bindings_spec_provider(self, memorypcp, pot_request, ie, logger):
+ """Two spec providers with identical key bindings must produce distinct cache keys."""
+
+ class ExampleProviderPCSP(PoTokenCacheSpecProvider):
+ PROVIDER_NAME = 'example'
+
+ def generate_cache_spec(self, request: PoTokenRequest):
+ return PoTokenCacheSpec(
+ key_bindings={'v': request.video_id},
+ default_ttl=60,
+ )
+
+ class ExampleProviderTwoPCSP(ExampleProviderPCSP):
+ pass
+
+ example_provider = ExampleProviderPCSP(ie=ie, logger=logger, settings={})
+ example_provider_two = ExampleProviderTwoPCSP(ie=ie, logger=logger, settings={})
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+
+ cache = PoTokenCache(
+ cache_providers=[memorypcp],
+ cache_spec_providers=[example_provider],
+ logger=logger,
+ )
+
+ assert cache.get(pot_request) is None
+ cache.store(pot_request, response)
+ assert len(memorypcp.cache) == 1
+ # Expected key: SHA-256 hex digest of the dict's string form, with '_dlp_cache' and '_p' ahead of the bindings
+ assert hashlib.sha256(
+ f"{{'_dlp_cache': 'v1', '_p': 'ExampleProvider', 'v': '{pot_request.video_id}'}}".encode()).hexdigest() in memorypcp.cache
+
+ # The second spec provider returns the exact same key bindings as the first one,
+ # however the PoTokenCache should use the provider key to differentiate between them
+ cache = PoTokenCache(
+ cache_providers=[memorypcp],
+ cache_spec_providers=[example_provider_two],
+ logger=logger,
+ )
+
+ assert cache.get(pot_request) is None
+ cache.store(pot_request, response)
+ assert len(memorypcp.cache) == 2
+ assert hashlib.sha256(
+ f"{{'_dlp_cache': 'v1', '_p': 'ExampleProviderTwo', 'v': '{pot_request.video_id}'}}".encode()).hexdigest() in memorypcp.cache
+
+    def test_cache_provider_preferences(self, pot_request, ie, logger):
+        """Preference functions registered on the cache change which provider is used first.
+
+        Without preferences, a WRITE_FIRST store and the following get() touch only pcp_one.
+        After two preference functions are appended (one of which returns -100 for pcp_one),
+        the next WRITE_FIRST store and get() are expected to go to pcp_two instead.
+        """
+        pcp_one = create_memory_pcp(ie, logger, provider_key='memory_pcp_one')
+        pcp_two = create_memory_pcp(ie, logger, provider_key='memory_pcp_two')
+
+        cache = PoTokenCache(
+            cache_providers=[pcp_one, pcp_two],
+            cache_spec_providers=[ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})],
+            logger=logger,
+        )
+
+        cache.store(pot_request, PoTokenResponse(EXAMPLE_PO_TOKEN), write_policy=CacheProviderWritePolicy.WRITE_FIRST)
+        assert len(pcp_one.cache) == 1
+        assert len(pcp_two.cache) == 0
+
+        assert cache.get(pot_request)
+        assert pcp_one.get_calls == 1
+        assert pcp_two.get_calls == 0
+
+        # Flags flipped by the preference functions so the test can prove both were invoked
+        standard_preference_called = False
+        pcp_one_preference_called = False
+
+        def standard_preference(provider, request, *_, **__):
+            nonlocal standard_preference_called
+            standard_preference_called = True
+            assert isinstance(provider, PoTokenCacheProvider)
+            assert isinstance(request, PoTokenRequest)
+            return 1
+
+        def pcp_one_preference(provider, request, *_, **__):
+            nonlocal pcp_one_preference_called
+            pcp_one_preference_called = True
+            assert isinstance(provider, PoTokenCacheProvider)
+            assert isinstance(request, PoTokenRequest)
+            # Strongly demote pcp_one; every other provider is left neutral
+            if provider.PROVIDER_KEY == pcp_one.PROVIDER_KEY:
+                return -100
+            return 0
+
+        # test that it can handle multiple preferences
+        cache.cache_provider_preferences.append(standard_preference)
+        cache.cache_provider_preferences.append(pcp_one_preference)
+
+        cache.store(pot_request, PoTokenResponse(EXAMPLE_PO_TOKEN), write_policy=CacheProviderWritePolicy.WRITE_FIRST)
+        assert cache.get(pot_request)
+        # pcp_one's counters are unchanged from the first half; the new store/get landed on pcp_two
+        assert len(pcp_one.cache) == len(pcp_two.cache) == 1
+        assert pcp_two.get_calls == pcp_one.get_calls == 1
+        assert pcp_one.store_calls == pcp_two.store_calls == 1
+        assert standard_preference_called
+        assert pcp_one_preference_called
+
+ def test_secondary_cache_provider_hit(self, pot_request, ie, logger):
+ """A hit in a lower priority cache provider is written back to the highest priority provider."""
+ pcp_one = create_memory_pcp(ie, logger, provider_key='memory_pcp_one')
+ pcp_two = create_memory_pcp(ie, logger, provider_key='memory_pcp_two')
+
+ # Start with pcp_two only, so the response is stored there first
+ cache = PoTokenCache(
+ cache_providers=[pcp_two],
+ cache_spec_providers=[ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ # Given the lower priority provider has the cache hit, store the response in the higher priority provider
+ cache.store(pot_request, PoTokenResponse(EXAMPLE_PO_TOKEN))
+ assert cache.get(pot_request)
+
+ # Register pcp_one afterwards, directly in the cache's provider mapping
+ cache.cache_providers[pcp_one.PROVIDER_KEY] = pcp_one
+
+ def pcp_one_pref(provider, *_, **__):
+ # Score pcp_one above every other provider
+ if provider.PROVIDER_KEY == pcp_one.PROVIDER_KEY:
+ return 1
+ return -1
+
+ cache.cache_provider_preferences.append(pcp_one_pref)
+
+ assert cache.get(pot_request)
+ assert pcp_one.get_calls == 1
+ assert pcp_two.get_calls == 2
+ # Should write back to pcp_one (now the highest priority cache provider)
+ assert pcp_one.store_calls == pcp_two.store_calls == 1
+ assert 'Writing PO Token response to highest priority cache provider' in logger.messages['trace']
+
+ def test_cache_provider_no_hits(self, pot_request, ie, logger):
+ """On a miss, every cache provider is queried exactly once and get() returns None."""
+ pcp_one = create_memory_pcp(ie, logger, provider_key='memory_pcp_one')
+ pcp_two = create_memory_pcp(ie, logger, provider_key='memory_pcp_two')
+
+ cache = PoTokenCache(
+ cache_providers=[pcp_one, pcp_two],
+ cache_spec_providers=[ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ assert cache.get(pot_request) is None
+ assert pcp_one.get_calls == pcp_two.get_calls == 1
+
+ def test_get_invalid_po_token_response(self, pot_request, ie, logger):
+ """Invalid entries in the first cache provider are deleted, logged, and replaced from the second provider.
+
+ Three corruptions of pcp_one's entry are exercised in turn: a response with a null po_token,
+ a non-JSON string, and JSON lacking the expected fields.
+ """
+ # Test various scenarios where the po token response stored in the cache provider is invalid
+ pcp_one = create_memory_pcp(ie, logger, provider_key='memory_pcp_one')
+ pcp_two = create_memory_pcp(ie, logger, provider_key='memory_pcp_two')
+
+ cache = PoTokenCache(
+ cache_providers=[pcp_one, pcp_two],
+ cache_spec_providers=[ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ valid_response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+ cache.store(pot_request, valid_response)
+ assert len(pcp_one.cache) == len(pcp_two.cache) == 1
+ # Overwrite the valid response with an invalid one in the cache
+ pcp_one.store(next(iter(pcp_one.cache.keys())), json.dumps(dataclasses.asdict(PoTokenResponse(None))), int(time.time() + 1000))
+ assert cache.get(pot_request).po_token == valid_response.po_token
+ assert pcp_one.get_calls == pcp_two.get_calls == 1
+ assert pcp_one.delete_calls == 1 # Invalid response should be deleted from cache
+ # 3 = initial cache.store() + the manual overwrite above + the write-back
+ assert pcp_one.store_calls == 3 # Since response was fetched from second cache provider, it should be stored in the first one
+ assert len(pcp_one.cache) == 1
+ assert 'Invalid PO Token response retrieved from cache provider "memory": {"po_token": null, "expires_at": null}; example bug report message' in logger.messages['error']
+
+ # Overwrite the valid response with an invalid json in the cache
+ pcp_one.store(next(iter(pcp_one.cache.keys())), 'invalid-json', int(time.time() + 1000))
+ assert cache.get(pot_request).po_token == valid_response.po_token
+ assert pcp_one.get_calls == pcp_two.get_calls == 2
+ assert pcp_one.delete_calls == 2
+ assert pcp_one.store_calls == 5 # 3 + 1 store we made in the test + 1 store from lower priority cache provider
+ assert len(pcp_one.cache) == 1
+
+ assert 'Invalid PO Token response retrieved from cache provider "memory": invalid-json; example bug report message' in logger.messages['error']
+
+ # Valid json, but missing required fields
+ pcp_one.store(next(iter(pcp_one.cache.keys())), '{"unknown_param": 0}', int(time.time() + 1000))
+ assert cache.get(pot_request).po_token == valid_response.po_token
+ assert pcp_one.get_calls == pcp_two.get_calls == 3
+ assert pcp_one.delete_calls == 3
+ assert pcp_one.store_calls == 7 # 5 + 1 store from test + 1 store from lower priority cache provider
+ assert len(pcp_one.cache) == 1
+
+ assert 'Invalid PO Token response retrieved from cache provider "memory": {"unknown_param": 0}; example bug report message' in logger.messages['error']
+
+ def test_store_invalid_po_token_response(self, pot_request, ie, logger):
+ """store() must refuse an invalid response: no provider store() call is made and an error is logged."""
+ # Should not store an invalid po token response
+ pcp_one = create_memory_pcp(ie, logger, provider_key='memory_pcp_one')
+
+ cache = PoTokenCache(
+ cache_providers=[pcp_one],
+ cache_spec_providers=[ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ # NOTE(review): expires_at=80 is presumably rejected as a timestamp already in the past - confirm against validate_response
+ cache.store(pot_request, PoTokenResponse(po_token=EXAMPLE_PO_TOKEN, expires_at=80))
+ assert cache.get(pot_request) is None
+ assert pcp_one.store_calls == 0
+ assert 'Invalid PO Token response provided to PoTokenCache.store()' in logger.messages['error'][0]
+
+ def test_store_write_policy(self, pot_request, ie, logger):
+ """An explicit write_policy argument: WRITE_FIRST stores to the first provider only, WRITE_ALL to every provider."""
+ pcp_one = create_memory_pcp(ie, logger, provider_key='memory_pcp_one')
+ pcp_two = create_memory_pcp(ie, logger, provider_key='memory_pcp_two')
+
+ cache = PoTokenCache(
+ cache_providers=[pcp_one, pcp_two],
+ cache_spec_providers=[ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ cache.store(pot_request, PoTokenResponse(EXAMPLE_PO_TOKEN), write_policy=CacheProviderWritePolicy.WRITE_FIRST)
+ assert pcp_one.store_calls == 1
+ assert pcp_two.store_calls == 0
+
+ # Counters are cumulative: pcp_one has now been written twice, pcp_two once
+ cache.store(pot_request, PoTokenResponse(EXAMPLE_PO_TOKEN), write_policy=CacheProviderWritePolicy.WRITE_ALL)
+ assert pcp_one.store_calls == 2
+ assert pcp_two.store_calls == 1
+
+ def test_store_write_first_policy_cache_spec(self, pot_request, ie, logger):  # with no explicit policy, store() follows the cache spec's write_policy
+ pcp_one = create_memory_pcp(ie, logger, provider_key='memory_pcp_one')
+ pcp_two = create_memory_pcp(ie, logger, provider_key='memory_pcp_two')
+
+ class WriteFirstPCSP(BaseMockCacheSpecProvider):  # spec provider whose spec requests WRITE_FIRST
+ def generate_cache_spec(self, request: PoTokenRequest):
+ super().generate_cache_spec(request)
+ return PoTokenCacheSpec(
+ key_bindings={'v': request.video_id, 'e': None},
+ default_ttl=60,
+ write_policy=CacheProviderWritePolicy.WRITE_FIRST,
+ )
+
+ cache = PoTokenCache(
+ cache_providers=[pcp_one, pcp_two],
+ cache_spec_providers=[WriteFirstPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ cache.store(pot_request, PoTokenResponse(EXAMPLE_PO_TOKEN))  # no write_policy argument: the spec's policy applies
+ assert pcp_one.store_calls == 1
+ assert pcp_two.store_calls == 0  # WRITE_FIRST: the second provider is not written
+
+ def test_store_write_all_policy_cache_spec(self, pot_request, ie, logger):  # with no explicit policy, store() follows the cache spec's write_policy
+ pcp_one = create_memory_pcp(ie, logger, provider_key='memory_pcp_one')
+ pcp_two = create_memory_pcp(ie, logger, provider_key='memory_pcp_two')
+
+ class WriteAllPCSP(BaseMockCacheSpecProvider):  # spec provider whose spec requests WRITE_ALL
+ def generate_cache_spec(self, request: PoTokenRequest):
+ super().generate_cache_spec(request)
+ return PoTokenCacheSpec(
+ key_bindings={'v': request.video_id, 'e': None},
+ default_ttl=60,
+ write_policy=CacheProviderWritePolicy.WRITE_ALL,
+ )
+
+ cache = PoTokenCache(
+ cache_providers=[pcp_one, pcp_two],
+ cache_spec_providers=[WriteAllPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ cache.store(pot_request, PoTokenResponse(EXAMPLE_PO_TOKEN))  # no write_policy argument: the spec's policy applies
+ assert pcp_one.store_calls == 1
+ assert pcp_two.store_calls == 1  # WRITE_ALL: the second provider is written as well
+
+ def test_expires_at_pot_response(self, pot_request, memorypcp, ie, logger):  # an explicit expires_at on the response is what gets stored
+ cache = PoTokenCache(
+ cache_providers=[memorypcp],
+ cache_spec_providers=[ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN, expires_at=10000000000)
+ cache.store(pot_request, response)
+ assert next(iter(memorypcp.cache.values()))[1] == 10000000000  # element [1] of the stored entry is presumably the expiry - confirm against the memorypcp fixture
+
+ def test_expires_at_default_spec(self, pot_request, memorypcp, ie, logger):  # without expires_at on the response, the expiry is derived from the spec's default_ttl
+
+ class TtlPCSP(BaseMockCacheSpecProvider):  # spec provider with a very large default_ttl
+ def generate_cache_spec(self, request: PoTokenRequest):
+ super().generate_cache_spec(request)
+ return PoTokenCacheSpec(
+ key_bindings={'v': request.video_id, 'e': None},
+ default_ttl=10000000000,
+ )
+
+ cache = PoTokenCache(
+ cache_providers=[memorypcp],
+ cache_spec_providers=[TtlPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)  # no expires_at given
+ cache.store(pot_request, response)
+ assert next(iter(memorypcp.cache.values()))[1] >= 10000000000  # >= rather than ==: presumably expiry is current time + default_ttl - confirm
+
+ def test_cache_provider_error_no_fallback(self, pot_request, ie, logger):  # a lone failing provider: store and get both fail, get() yields None
+ error_pcp = ErrorPCP(ie, logger, {})
+ cache = PoTokenCache(
+ cache_providers=[error_pcp],
+ cache_spec_providers=[ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+ cache.store(pot_request, response)
+ assert cache.get(pot_request) is None
+ assert error_pcp.get_calls == 1  # each operation was attempted exactly once
+ assert error_pcp.store_calls == 1
+
+ assert logger.messages['warning'].count("Error from \"error\" PO Token cache provider: PoTokenCacheProviderError('something went wrong'); example bug report message") == 2  # one warning per failed operation (store + get)
+
+ def test_cache_provider_error_fallback(self, pot_request, ie, logger):  # a failing first provider falls back to the working memory provider
+ error_pcp = ErrorPCP(ie, logger, {})
+ memory_pcp = create_memory_pcp(ie, logger, provider_key='memory')
+
+ cache = PoTokenCache(
+ cache_providers=[error_pcp, memory_pcp],
+ cache_spec_providers=[ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+ cache.store(pot_request, response)
+
+ # 1. Store fails for error_pcp, stored in memory_pcp
+ # 2. Get fails for error_pcp, fetched from memory_pcp
+ # 3. Since fetched from lower priority, it should be stored in the highest priority cache provider
+ # 4. Store fails in error_pcp. Since write policy is WRITE_FIRST, it should not try to store in memory_pcp regardless of whether the store in error_pcp fails
+
+ assert cache.get(pot_request)
+ assert error_pcp.get_calls == 1
+ assert error_pcp.store_calls == 2  # initial store + write-back after the hit in the lower-priority provider
+ assert memory_pcp.get_calls == 1
+ assert memory_pcp.store_calls == 1  # only the initial store; the write-back does not reach it
+
+ assert logger.messages['warning'].count("Error from \"error\" PO Token cache provider: PoTokenCacheProviderError('something went wrong'); example bug report message") == 3  # store, get and write-back store all failed on error_pcp
+
+ def test_cache_provider_unexpected_error_no_fallback(self, pot_request, ie, logger):  # same as the PoTokenCacheProviderError case, but failures are logged as errors
+ error_pcp = UnexpectedErrorPCP(ie, logger, {})
+ cache = PoTokenCache(
+ cache_providers=[error_pcp],
+ cache_spec_providers=[ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+ cache.store(pot_request, response)
+ assert cache.get(pot_request) is None
+ assert error_pcp.get_calls == 1  # each operation was attempted exactly once
+ assert error_pcp.store_calls == 1
+
+ assert logger.messages['error'].count("Error occurred with \"unexpected_error\" PO Token cache provider: ValueError('something went wrong'); example bug report message") == 2  # one error per failed operation (store + get)
+
+ def test_cache_provider_unexpected_error_fallback(self, pot_request, ie, logger):  # an unexpectedly failing first provider falls back to the memory provider
+ error_pcp = UnexpectedErrorPCP(ie, logger, {})
+ memory_pcp = create_memory_pcp(ie, logger, provider_key='memory')
+
+ cache = PoTokenCache(
+ cache_providers=[error_pcp, memory_pcp],
+ cache_spec_providers=[ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+ cache.store(pot_request, response)
+
+ # 1. Store fails for error_pcp, stored in memory_pcp
+ # 2. Get fails for error_pcp, fetched from memory_pcp
+ # 3. Since fetched from lower priority, it should be stored in the highest priority cache provider
+ # 4. Store fails in error_pcp. Since write policy is WRITE_FIRST, it should not try to store in memory_pcp regardless of whether the store in error_pcp fails
+
+ assert cache.get(pot_request)
+ assert error_pcp.get_calls == 1
+ assert error_pcp.store_calls == 2  # initial store + write-back after the hit in the lower-priority provider
+ assert memory_pcp.get_calls == 1
+ assert memory_pcp.store_calls == 1  # only the initial store; the write-back does not reach it
+
+ assert logger.messages['error'].count("Error occurred with \"unexpected_error\" PO Token cache provider: ValueError('something went wrong'); example bug report message") == 3  # store, get and write-back store all failed on error_pcp
+
+ def test_cache_provider_unavailable_no_fallback(self, pot_request, ie, logger):  # an unavailable provider is never used for store or get
+ provider = create_memory_pcp(ie, logger, available=False)
+
+ cache = PoTokenCache(
+ cache_providers=[provider],
+ cache_spec_providers=[ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+ cache.store(pot_request, response)
+ assert cache.get(pot_request) is None
+ assert provider.get_calls == 0
+ assert provider.store_calls == 0
+ assert provider.available_called_times  # non-zero: its availability was checked
+
+ def test_cache_provider_unavailable_fallback(self, pot_request, ie, logger):  # an unavailable first provider is skipped; the available one serves the request
+ provider_unavailable = create_memory_pcp(ie, logger, provider_key='unavailable', provider_name='unavailable', available=False)
+ provider_available = create_memory_pcp(ie, logger, provider_key='available', provider_name='available')
+
+ cache = PoTokenCache(
+ cache_providers=[provider_unavailable, provider_available],
+ cache_spec_providers=[ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+ cache.store(pot_request, response)
+ assert cache.get(pot_request) is not None
+ assert provider_unavailable.get_calls == 0
+ assert provider_unavailable.store_calls == 0
+ assert provider_available.get_calls == 1
+ assert provider_available.store_calls == 1
+ assert provider_unavailable.available_called_times  # non-zero: availability of both providers was checked
+ assert provider_available.available_called_times
+
+ # The unavailable provider must not even be attempted for the request
+ assert 'Attempting to fetch a PO Token response from "unavailable" provider' not in logger.messages['trace']
+ assert 'Attempting to fetch a PO Token response from "available" provider' not in logger.messages['trace']  # NOTE(review): also asserted absent for the provider that served the request - confirm this is intended
+
+ def test_available_not_called(self, ie, pot_request, logger):
+ # At INFO log level, availability of a lower-priority provider must not be checked when a higher-priority provider is available
+ provider_unavailable = create_memory_pcp(
+ ie, logger, provider_key='unavailable', provider_name='unavailable', available=False)
+ provider_available = create_memory_pcp(ie, logger, provider_key='available', provider_name='available')
+
+ logger.log_level = logger.LogLevel.INFO
+
+ cache = PoTokenCache(
+ cache_providers=[provider_available, provider_unavailable],
+ cache_spec_providers=[ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+ cache.store(pot_request, response, write_policy=CacheProviderWritePolicy.WRITE_FIRST)
+ assert cache.get(pot_request) is not None
+ assert provider_unavailable.get_calls == 0
+ assert provider_unavailable.store_calls == 0
+ assert provider_available.get_calls == 1
+ assert provider_available.store_calls == 1
+ assert provider_unavailable.available_called_times == 0  # never probed: the first provider handled everything
+ assert provider_available.available_called_times
+ assert 'PO Token Cache Providers: available-0.0.0 (external), unavailable-0.0.0 (external, unavailable)' not in logger.messages.get('trace', [])  # the provider list is not written to the trace log
+
+ def test_available_called_trace(self, ie, pot_request, logger):
+ # At TRACE log level every provider's availability is checked, because the provider list is written to the trace log
+ provider_unavailable = create_memory_pcp(
+ ie, logger, provider_key='unavailable', provider_name='unavailable', available=False)
+ provider_available = create_memory_pcp(ie, logger, provider_key='available', provider_name='available')
+
+ logger.log_level = logger.LogLevel.TRACE
+
+ cache = PoTokenCache(
+ cache_providers=[provider_available, provider_unavailable],
+ cache_spec_providers=[ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})],
+ logger=logger,
+ )
+
+ response = PoTokenResponse(EXAMPLE_PO_TOKEN)
+ cache.store(pot_request, response, write_policy=CacheProviderWritePolicy.WRITE_FIRST)
+ assert cache.get(pot_request) is not None
+ assert provider_unavailable.get_calls == 0  # still never used for the request itself
+ assert provider_unavailable.store_calls == 0
+ assert provider_available.get_calls == 1
+ assert provider_available.store_calls == 1
+ assert provider_unavailable.available_called_times  # non-zero this time
+ assert provider_available.available_called_times
+ assert 'PO Token Cache Providers: available-0.0.0 (external), unavailable-0.0.0 (external, unavailable)' in logger.messages.get('trace', [])
+
+ def test_close(self, ie, pot_request, logger):
+ # PoTokenCache.close() must call close on every cache provider and every cache spec provider
+ memory_pcp = create_memory_pcp(ie, logger, provider_key='memory')
+ memory2_pcp = create_memory_pcp(ie, logger, provider_key='memory2')
+
+ spec1 = ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})
+ spec2 = UnavailableCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})
+
+ cache = PoTokenCache(
+ cache_providers=[memory2_pcp, memory_pcp],
+ cache_spec_providers=[spec1, spec2],
+ logger=logger,
+ )
+
+ cache.close()
+ assert memory_pcp.close_called
+ assert memory2_pcp.close_called
+ assert spec1.close_called
+ assert spec2.close_called
+
+
+class TestPoTokenRequestDirector:
+
+ def test_request_pot_success(self, ie, pot_request, pot_cache, pot_provider, logger):  # happy path: the registered provider's token is returned
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ director.register_provider(pot_provider)
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+
+ def test_request_and_cache(self, ie, pot_request, pot_cache, pot_provider, logger):  # a fetched token is cached and reused for the next request
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ director.register_provider(pot_provider)
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+ assert pot_provider.request_called_times == 1
+ assert pot_cache.get_calls == 1  # cache was consulted first (a miss)
+ assert pot_cache.store_calls == 1  # and the fresh token was stored
+
+ # Second request is served from the cache: one more cache read, no new store, no new provider request
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+ assert pot_cache.get_calls == 2
+ assert pot_cache.store_calls == 1
+ assert pot_provider.request_called_times == 1
+
+ def test_bypass_cache(self, ie, pot_request, pot_cache, logger, pot_provider):  # bypass_cache skips cache reads, but fresh tokens are still stored
+ pot_request.bypass_cache = True
+
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ director.register_provider(pot_provider)
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+ assert pot_provider.request_called_times == 1
+ assert pot_cache.get_calls == 0  # the cache was not read
+ assert pot_cache.store_calls == 1  # but the token was written to it
+
+ # Second request with bypass_cache still set: the provider is asked again and the cache is still not read
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+ assert pot_provider.request_called_times == 2
+ assert pot_cache.get_calls == 0
+ assert pot_cache.store_calls == 2
+
+ # With bypass_cache cleared, the token stored earlier is served from the cache (no new provider request or store)
+ pot_request.bypass_cache = False
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+ assert pot_provider.request_called_times == 2
+ assert pot_cache.get_calls == 1
+ assert pot_cache.store_calls == 2
+
+ def test_clean_pot_generate(self, ie, pot_request, pot_cache, logger):
+ # A token returned by a provider is cleaned (here the '?extra=params' suffix is dropped) before it is returned
+ base_token = base64.urlsafe_b64encode(b'token').decode()
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ provider = success_ptp(PoTokenResponse(base_token + '?extra=params'))(ie, logger, settings={})
+ director.register_provider(provider)
+
+ response = director.get_po_token(pot_request)
+ assert response == base_token
+ assert provider.request_called_times == 1
+
+ # Confirm the cleaned version was stored in the cache
+ cached_token = pot_cache.get(pot_request)
+ assert cached_token.po_token == base_token
+
+ def test_clean_pot_cache(self, ie, pot_request, pot_cache, logger, pot_provider):
+ # A token read back from the cache is cleaned before it is returned, even if it was stored uncleaned
+ base_token = base64.urlsafe_b64encode(b'token').decode()
+ pot_cache.store(pot_request, PoTokenResponse(base_token + '?extra=params'))  # seed the cache directly with an uncleaned token
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ director.register_provider(pot_provider)
+
+ response = director.get_po_token(pot_request)
+ assert response == base_token
+ assert pot_cache.get_calls == 1
+ assert pot_provider.request_called_times == 0  # served from the cache; the provider was not asked
+
+ def test_cache_expires_at_none(self, ie, pot_request, pot_cache, logger, pot_provider):
+ # A response with expires_at=None is still written to the cache
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ provider = success_ptp(PoTokenResponse(EXAMPLE_PO_TOKEN, expires_at=None))(ie, logger, settings={})
+ director.register_provider(provider)
+
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+ assert pot_cache.store_calls == 1
+ assert pot_cache.get(pot_request).po_token == EXAMPLE_PO_TOKEN
+
+ def test_cache_expires_at_positive(self, ie, pot_request, pot_cache, logger, pot_provider):
+ # A response with a positive expires_at (here a very large value) is written to the cache
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ provider = success_ptp(PoTokenResponse(EXAMPLE_PO_TOKEN, expires_at=99999999999))(ie, logger, settings={})
+ director.register_provider(provider)
+
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+ assert pot_cache.store_calls == 1
+ assert pot_cache.get(pot_request).po_token == EXAMPLE_PO_TOKEN
+
+ @pytest.mark.parametrize('expires_at', [0, -1])
+ def test_not_cache_expires_at(self, ie, pot_request, pot_cache, logger, pot_provider, expires_at):
+ # A response with expires_at <= 0 is returned to the caller but never written to the cache
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ provider = success_ptp(PoTokenResponse(EXAMPLE_PO_TOKEN, expires_at=expires_at))(ie, logger, settings={})
+ director.register_provider(provider)
+
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+ assert pot_cache.store_calls == 0
+ assert pot_cache.get(pot_request) is None
+
+ def test_no_providers(self, ie, pot_request, pot_cache, logger):  # no provider registered and nothing stored by this test: get_po_token() returns None
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ response = director.get_po_token(pot_request)
+ assert response is None
+
+ def test_try_cache_no_providers(self, ie, pot_request, pot_cache, logger):
+ # The cache is consulted even when no providers are registered, so a pre-stored token is returned
+ pot_cache.store(pot_request, PoTokenResponse(EXAMPLE_PO_TOKEN))
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+
+ def test_close(self, ie, pot_request, pot_cache, pot_provider, logger):
+ # director.close() must call close on the PO Token cache and on every registered provider
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+
+ provider2 = UnavailablePTP(ie, logger, {})
+ director.register_provider(pot_provider)
+ director.register_provider(provider2)
+
+ director.close()
+ assert pot_provider.close_called
+ assert provider2.close_called
+ assert pot_cache.close_called
+
+ def test_pot_provider_preferences(self, pot_request, pot_cache, ie, logger):  # registered preference functions change which provider is tried first
+ pot_request.bypass_cache = True  # keep the cache from answering, so each call below reaches a provider
+ provider_two_pot = base64.urlsafe_b64encode(b'token2').decode()
+
+ example_provider = success_ptp(response=PoTokenResponse(EXAMPLE_PO_TOKEN), key='exampleone')(ie, logger, settings={})
+ example_provider_two = success_ptp(response=PoTokenResponse(provider_two_pot), key='exampletwo')(ie, logger, settings={})
+
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ director.register_provider(example_provider)
+ director.register_provider(example_provider_two)
+
+ response = director.get_po_token(pot_request)  # no preferences registered yet: example_provider answers
+ assert response == EXAMPLE_PO_TOKEN
+ assert example_provider.request_called_times == 1
+ assert example_provider_two.request_called_times == 0
+
+ standard_preference_called = False
+ example_preference_called = False
+
+ # Two preference functions; each records that it was called and checks the argument types it receives
+ def standard_preference(provider, request, *_, **__):
+ nonlocal standard_preference_called
+ standard_preference_called = True
+ assert isinstance(provider, PoTokenProvider)
+ assert isinstance(request, PoTokenRequest)
+ return 1  # same score for every provider
+
+ def example_preference(provider, request, *_, **__):
+ nonlocal example_preference_called
+ example_preference_called = True
+ assert isinstance(provider, PoTokenProvider)
+ assert isinstance(request, PoTokenRequest)
+ if provider.PROVIDER_KEY == example_provider.PROVIDER_KEY:
+ return -100  # strongly penalise example_provider
+ return 0
+
+ # test that it can handle multiple preferences
+ director.register_preference(example_preference)
+ director.register_preference(standard_preference)
+
+ response = director.get_po_token(pot_request)  # now example_provider_two answers instead
+ assert response == provider_two_pot
+ assert example_provider.request_called_times == 1  # unchanged: it was not asked this time
+ assert example_provider_two.request_called_times == 1
+ assert standard_preference_called
+ assert example_preference_called
+
+ def test_unsupported_request_no_fallback(self, ie, logger, pot_cache, pot_request):  # the only provider rejects the request: result is None
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ provider = UnsupportedPTP(ie, logger, {})
+ director.register_provider(provider)
+
+ response = director.get_po_token(pot_request)
+ assert response is None
+ assert provider.request_called_times == 1  # the provider was asked once
+
+ def test_unsupported_request_fallback(self, ie, logger, pot_cache, pot_request, pot_provider):
+ # When the first provider rejects the request, the director falls back to the next provider and traces the reason
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ provider = UnsupportedPTP(ie, logger, {})
+ director.register_provider(provider)
+ director.register_provider(pot_provider)
+
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+ assert provider.request_called_times == 1
+ assert pot_provider.request_called_times == 1
+ assert 'PO Token Provider "unsupported" rejected this request, trying next available provider. Reason: unsupported request' in logger.messages['trace']
+
+ def test_unavailable_request_no_fallback(self, ie, logger, pot_cache, pot_request):  # the only provider is unavailable: result is None and it is never asked
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ provider = UnavailablePTP(ie, logger, {})
+ director.register_provider(provider)
+
+ response = director.get_po_token(pot_request)
+ assert response is None
+ assert provider.request_called_times == 0
+ assert provider.available_called_times  # non-zero: only its availability was checked
+
+ def test_unavailable_request_fallback(self, ie, logger, pot_cache, pot_request, pot_provider):
+ # When the first provider is unavailable, the director falls back to the next provider
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ provider = UnavailablePTP(ie, logger, {})
+ director.register_provider(provider)
+ director.register_provider(pot_provider)
+
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+ assert provider.request_called_times == 0
+ assert provider.available_called_times
+ assert pot_provider.request_called_times == 1
+ assert pot_provider.available_called_times
+ # The unavailable provider must not even be attempted for the request; only the fallback is
+ assert 'Attempting to fetch a PO Token from "unavailable" provider' not in logger.messages['trace']
+ assert 'Attempting to fetch a PO Token from "success" provider' in logger.messages['trace']
+
+ def test_available_not_called(self, ie, logger, pot_cache, pot_request, pot_provider):
+ # At INFO log level, availability of a lower-priority provider must not be checked when a higher-priority provider is available
+ logger.log_level = logger.LogLevel.INFO
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ provider = UnavailablePTP(ie, logger, {})
+ director.register_provider(pot_provider)
+ director.register_provider(provider)
+
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+ assert provider.request_called_times == 0
+ assert provider.available_called_times == 0  # never probed
+ assert pot_provider.request_called_times == 1
+ assert pot_provider.available_called_times == 2  # NOTE(review): exact count depends on director internals not visible here
+ assert 'PO Token Providers: success-0.0.1 (external), unavailable-0.0.0 (external, unavailable)' not in logger.messages.get('trace', [])
+
+ def test_available_called_trace(self, ie, logger, pot_cache, pot_request, pot_provider):
+ # At TRACE log level every provider's availability is checked, because the provider list is written to the trace log
+ logger.log_level = logger.LogLevel.TRACE
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ provider = UnavailablePTP(ie, logger, {})
+ director.register_provider(pot_provider)
+ director.register_provider(provider)
+
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+ assert provider.request_called_times == 0  # still never used for the request itself
+ assert provider.available_called_times == 1  # probed once
+ assert pot_provider.request_called_times == 1
+ assert pot_provider.available_called_times == 3  # one more probe than the INFO-level variant of this test expects
+ assert 'PO Token Providers: success-0.0.1 (external), unavailable-0.0.0 (external, unavailable)' in logger.messages['trace']
+
+ def test_provider_error_no_fallback_unexpected(self, ie, logger, pot_cache, pot_request):  # provider error with no fallback: None is returned and the warning carries the bug-report suffix
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ provider = ErrorPTP(ie, logger, {})
+ director.register_provider(provider)
+ pot_request.video_id = 'unexpected'  # presumably selects ErrorPTP's non-expected error variant - confirm against ErrorPTP
+ response = director.get_po_token(pot_request)
+ assert response is None
+ assert provider.request_called_times == 1
+ assert "Error fetching PO Token from \"error\" provider: PoTokenProviderError('an error occurred'); please report this issue to the provider developer at https://error.example.com/issues ." in logger.messages['warning']
+
+ def test_provider_error_no_fallback_expected(self, ie, logger, pot_cache, pot_request):  # provider error with no fallback: None is returned and the warning has no bug-report suffix
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ provider = ErrorPTP(ie, logger, {})
+ director.register_provider(provider)
+ pot_request.video_id = 'expected'  # presumably selects ErrorPTP's expected error variant - confirm against ErrorPTP
+ response = director.get_po_token(pot_request)
+ assert response is None
+ assert provider.request_called_times == 1
+ assert "Error fetching PO Token from \"error\" provider: PoTokenProviderError('an error occurred')" in logger.messages['warning']
+
+ def test_provider_error_fallback(self, ie, logger, pot_cache, pot_request, pot_provider):
+ # When the first provider raises a provider error, a warning is logged and the next provider is used
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ provider = ErrorPTP(ie, logger, {})
+ director.register_provider(provider)
+ director.register_provider(pot_provider)
+
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+ assert provider.request_called_times == 1
+ assert pot_provider.request_called_times == 1
+ assert "Error fetching PO Token from \"error\" provider: PoTokenProviderError('an error occurred'); please report this issue to the provider developer at https://error.example.com/issues ." in logger.messages['warning']
+
+ def test_provider_unexpected_error_no_fallback(self, ie, logger, pot_cache, pot_request):  # a non-provider exception is logged at error level and None is returned
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ provider = UnexpectedErrorPTP(ie, logger, {})
+ director.register_provider(provider)
+
+ response = director.get_po_token(pot_request)
+ assert response is None
+ assert provider.request_called_times == 1
+ assert "Unexpected error when fetching PO Token from \"unexpected_error\" provider: ValueError('an unexpected error occurred'); please report this issue to the provider developer at https://unexpected.example.com/issues ." in logger.messages['error']
+
+ def test_provider_unexpected_error_fallback(self, ie, logger, pot_cache, pot_request, pot_provider):
+ # When the first provider raises an unexpected exception, an error is logged and the next provider is used
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ provider = UnexpectedErrorPTP(ie, logger, {})
+ director.register_provider(provider)
+ director.register_provider(pot_provider)
+
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+ assert provider.request_called_times == 1
+ assert pot_provider.request_called_times == 1
+ assert "Unexpected error when fetching PO Token from \"unexpected_error\" provider: ValueError('an unexpected error occurred'); please report this issue to the provider developer at https://unexpected.example.com/issues ." in logger.messages['error']
+
+ def test_invalid_po_token_response_type(self, ie, logger, pot_cache, pot_request, pot_provider):  # a provider result of the wrong type is rejected with an error
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ provider = InvalidPTP(ie, logger, {})
+ director.register_provider(provider)
+
+ pot_request.video_id = 'invalid_type'  # presumably makes InvalidPTP return a non-PoTokenResponse value - confirm against InvalidPTP
+
+ response = director.get_po_token(pot_request)
+ assert response is None
+ assert provider.request_called_times == 1
+ assert 'Invalid PO Token response received from "invalid" provider: invalid-response; please report this issue to the provider developer at https://invalid.example.com/issues .' in logger.messages['error']
+
+ # Once a working provider is registered, the invalid one is still tried first and the director then falls back
+ director.register_provider(pot_provider)
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+ assert provider.request_called_times == 2
+ assert pot_provider.request_called_times == 1
+
+ def test_invalid_po_token_response(self, ie, logger, pot_cache, pot_request, pot_provider):  # a PoTokenResponse that fails validation is rejected with an error
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+ provider = InvalidPTP(ie, logger, {})
+ director.register_provider(provider)
+
+ response = director.get_po_token(pot_request)
+ assert response is None
+ assert provider.request_called_times == 1
+ assert "Invalid PO Token response received from \"invalid\" provider: PoTokenResponse(po_token='example-token?', expires_at='123'); please report this issue to the provider developer at https://invalid.example.com/issues ." in logger.messages['error']
+
+ # Once a working provider is registered, the invalid one is still tried first and the director then falls back
+ director.register_provider(pot_provider)
+ response = director.get_po_token(pot_request)
+ assert response == EXAMPLE_PO_TOKEN
+ assert provider.request_called_times == 2
+ assert pot_provider.request_called_times == 1
+
+ def test_copy_request_provider(self, ie, logger, pot_cache, pot_request):  # a provider that mutates its request must not affect later providers or the caller's request
+
+ class BadProviderPTP(BaseMockPoTokenProvider):  # mutates the request it is given, then rejects it
+ _SUPPORTED_CONTEXTS = None
+ _SUPPORTED_CLIENTS = None
+
+ def _real_request_pot(self, request: PoTokenRequest) -> PoTokenResponse:
+ # Providers should not modify the request object, but we should guard against it
+ request.video_id = 'bad'
+ raise PoTokenProviderRejectedRequest('bad request')
+
+ class GoodProviderPTP(BaseMockPoTokenProvider):  # echoes back the video_id it sees, base64-encoded, as the token
+ _SUPPORTED_CONTEXTS = None
+ _SUPPORTED_CLIENTS = None
+
+ def _real_request_pot(self, request: PoTokenRequest) -> PoTokenResponse:
+ return PoTokenResponse(base64.urlsafe_b64encode(request.video_id.encode()).decode())
+
+ director = PoTokenRequestDirector(logger=logger, cache=pot_cache)
+
+ bad_provider = BadProviderPTP(ie, logger, {})
+ good_provider = GoodProviderPTP(ie, logger, {})
+
+ director.register_provider(bad_provider)
+ director.register_provider(good_provider)
+
+ pot_request.video_id = 'good'
+ response = director.get_po_token(pot_request)
+ assert response == base64.urlsafe_b64encode(b'good').decode()  # good_provider saw 'good', not the 'bad' written by bad_provider
+ assert bad_provider.request_called_times == 1
+ assert good_provider.request_called_times == 1
+ assert pot_request.video_id == 'good'  # the caller's request object is unchanged too
+
+
+@pytest.mark.parametrize('spec, expected', [
+ (None, False),  # no spec at all
+ (PoTokenCacheSpec(key_bindings={'v': 'video-id'}, default_ttl=60, write_policy=None), False), # type: ignore  # write_policy of None
+ (PoTokenCacheSpec(key_bindings={'v': 'video-id'}, default_ttl='invalid'), False), # type: ignore  # non-numeric default_ttl
+ (PoTokenCacheSpec(key_bindings='invalid', default_ttl=60), False), # type: ignore  # key_bindings is not a dict
+ (PoTokenCacheSpec(key_bindings={2: 'video-id'}, default_ttl=60), False), # type: ignore  # non-string binding key
+ (PoTokenCacheSpec(key_bindings={'v': 2}, default_ttl=60), False), # type: ignore  # non-string binding value
+ (PoTokenCacheSpec(key_bindings={'v': None}, default_ttl=60), False), # type: ignore  # a lone None binding is rejected; None next to a string binding is accepted below
+
+ (PoTokenCacheSpec(key_bindings={'v': 'video_id', 'e': None}, default_ttl=60), True),
+ (PoTokenCacheSpec(key_bindings={'v': 'video_id'}, default_ttl=60, write_policy=CacheProviderWritePolicy.WRITE_FIRST), True),
+])
+def test_validate_cache_spec(spec, expected):  # validate_cache_spec() must return the expected verdict for each case above
+ assert validate_cache_spec(spec) == expected
+
+
+@pytest.mark.parametrize('po_token', [
+ 'invalid-token?',
+ '123',
+])
+def test_clean_pot_fail(po_token):  # clean_pot() must raise ValueError matching 'Invalid PO Token' for each input above
+ with pytest.raises(ValueError, match='Invalid PO Token'):
+ clean_pot(po_token)
+
+
+@pytest.mark.parametrize('po_token,expected', [
+ ('TwAA/+8=', 'TwAA_-8='),  # '/' and '+' come back as '_' and '-'
+ ('TwAA%5F%2D9VA6Q92v%5FvEQ4==?extra-param=2', 'TwAA_-9VA6Q92v_vEQ4='),  # percent-escapes decoded, '?...' suffix dropped, padding changed
+])
+def test_clean_pot(po_token, expected):  # clean_pot() must return the expected cleaned token for each input above
+ assert clean_pot(po_token) == expected
+
+
+@pytest.mark.parametrize(
+ 'response, expected',
+ [
+ (None, False),  # no response at all
+ (PoTokenResponse(None), False),  # missing token
+ (PoTokenResponse(1), False),  # non-string token
+ (PoTokenResponse('invalid-token?'), False),  # same token string that the clean_pot failure test uses
+ (PoTokenResponse(EXAMPLE_PO_TOKEN, expires_at='abc'), False), # type: ignore  # non-numeric expiry
+ (PoTokenResponse(EXAMPLE_PO_TOKEN, expires_at=100), False),  # small positive expiry (presumably: already in the past - confirm)
+ (PoTokenResponse(EXAMPLE_PO_TOKEN, expires_at=time.time() + 10000.0), False), # type: ignore  # float expiry is rejected; the int equivalent below is accepted
+ (PoTokenResponse(EXAMPLE_PO_TOKEN), True),
+ (PoTokenResponse(EXAMPLE_PO_TOKEN, expires_at=-1), True),  # zero / negative expiry still validates
+ (PoTokenResponse(EXAMPLE_PO_TOKEN, expires_at=0), True),
+ (PoTokenResponse(EXAMPLE_PO_TOKEN, expires_at=int(time.time()) + 10000), True),
+ ],
+)
+def test_validate_pot_response(response, expected):  # validate_response() must return the expected verdict for each case above
+ assert validate_response(response) == expected
+
+
+def test_built_in_provider(ie, logger):  # provider_display_list() output for built-in, external and unavailable providers
+ class BuiltinProviderDefaultT(BuiltinIEContentProvider, suffix='T'):  # built-in, default name
+ def is_available(self):
+ return True
+
+ class BuiltinProviderCustomNameT(BuiltinIEContentProvider, suffix='T'):  # built-in, explicit PROVIDER_NAME
+ PROVIDER_NAME = 'CustomName'
+
+ def is_available(self):
+ return True
+
+ class ExternalProviderDefaultT(IEContentProvider, suffix='T'):  # external, default name and version
+ def is_available(self):
+ return True
+
+ class ExternalProviderCustomT(IEContentProvider, suffix='T'):  # external, explicit name and version
+ PROVIDER_NAME = 'custom'
+ PROVIDER_VERSION = '5.4b2'
+
+ def is_available(self):
+ return True
+
+ class ExternalProviderUnavailableT(IEContentProvider, suffix='T'):  # external, reports itself unavailable
+ def is_available(self) -> bool:
+ return False
+
+ class BuiltinProviderUnavailableT(IEContentProvider, suffix='T'):  # NOTE(review): named "Builtin" but derives from IEContentProvider, so it is displayed as external below - confirm intended
+ def is_available(self) -> bool:
+ return False
+
+ built_in_default = BuiltinProviderDefaultT(ie=ie, logger=logger, settings={})
+ built_in_custom_name = BuiltinProviderCustomNameT(ie=ie, logger=logger, settings={})
+ built_in_unavailable = BuiltinProviderUnavailableT(ie=ie, logger=logger, settings={})
+ external_default = ExternalProviderDefaultT(ie=ie, logger=logger, settings={})
+ external_custom = ExternalProviderCustomT(ie=ie, logger=logger, settings={})
+ external_unavailable = ExternalProviderUnavailableT(ie=ie, logger=logger, settings={})
+
+ assert provider_display_list([]) == 'none'  # empty list is rendered as 'none'
+ assert provider_display_list([built_in_default]) == 'BuiltinProviderDefault'  # built-in: name only, the 'T' suffix is not shown
+ assert provider_display_list([external_unavailable]) == 'ExternalProviderUnavailable-0.0.0 (external, unavailable)'  # external: name-version plus markers
+ assert provider_display_list([
+ built_in_default,
+ built_in_custom_name,
+ external_default,
+ external_custom,
+ external_unavailable,
+ built_in_unavailable],
+ ) == 'BuiltinProviderDefault, CustomName, ExternalProviderDefault-0.0.0 (external), custom-5.4b2 (external), ExternalProviderUnavailable-0.0.0 (external, unavailable), BuiltinProviderUnavailable-0.0.0 (external, unavailable)'
diff --git a/test/test_pot/test_pot_framework.py b/test/test_pot/test_pot_framework.py
new file mode 100644
index 000000000..bc94653f4
--- /dev/null
+++ b/test/test_pot/test_pot_framework.py
@@ -0,0 +1,629 @@
+import pytest
+
+from yt_dlp.extractor.youtube.pot._provider import IEContentProvider
+from yt_dlp.cookies import YoutubeDLCookieJar
+from yt_dlp.utils.networking import HTTPHeaderDict
+from yt_dlp.extractor.youtube.pot.provider import (
+ PoTokenRequest,
+ PoTokenContext,
+ ExternalRequestFeature,
+
+)
+
+from yt_dlp.extractor.youtube.pot.cache import (
+ PoTokenCacheProvider,
+ PoTokenCacheSpec,
+ PoTokenCacheSpecProvider,
+ CacheProviderWritePolicy,
+)
+
+import yt_dlp.extractor.youtube.pot.cache as cache
+
+from yt_dlp.networking import Request
+from yt_dlp.extractor.youtube.pot.provider import (
+ PoTokenResponse,
+ PoTokenProvider,
+ PoTokenProviderRejectedRequest,
+ provider_bug_report_message,
+ register_provider,
+ register_preference,
+)
+
+from yt_dlp.extractor.youtube.pot._registry import _pot_providers, _ptp_preferences, _pot_pcs_providers, _pot_cache_providers, _pot_cache_provider_preferences
+
+
+class ExamplePTP(PoTokenProvider):
+ """Minimal PO Token provider used as a test fixture: always available and returns a fixed token."""
+ PROVIDER_NAME = 'example'
+ PROVIDER_VERSION = '0.0.1'
+ BUG_REPORT_LOCATION = 'https://example.com/issues'
+
+ # Only the WEB client and the GVS context are declared as supported
+ _SUPPORTED_CLIENTS = ('WEB',)
+ _SUPPORTED_CONTEXTS = (PoTokenContext.GVS, )
+
+ # Only HTTP and SOCKS5H proxy schemes are declared; source address and
+ # disabling TLS verification are deliberately left out
+ _SUPPORTED_EXTERNAL_REQUEST_FEATURES = (
+ ExternalRequestFeature.PROXY_SCHEME_HTTP,
+ ExternalRequestFeature.PROXY_SCHEME_SOCKS5H,
+ )
+
+ def is_available(self) -> bool:
+ return True
+
+ def _real_request_pot(self, request: PoTokenRequest) -> PoTokenResponse:
+ # Constant response so tests can assert on exact values
+ return PoTokenResponse('example-token', expires_at=123)
+
+
+class ExampleCacheProviderPCP(PoTokenCacheProvider):
+ """Stub cache provider fixture: always available, `get` returns a constant, `store` and `delete` do nothing."""
+
+ PROVIDER_NAME = 'example'
+ PROVIDER_VERSION = '0.0.1'
+ BUG_REPORT_LOCATION = 'https://example.com/issues'
+
+ def is_available(self) -> bool:
+ return True
+
+ def get(self, key: str):
+ # Same value for every key
+ return 'example-cache'
+
+ def store(self, key: str, value: str, expires_at: int):
+ pass
+
+ def delete(self, key: str):
+ pass
+
+
+class ExampleCacheSpecProviderPCSP(PoTokenCacheSpecProvider):
+ """Stub cache spec provider fixture that returns the same spec for every request."""
+
+ PROVIDER_NAME = 'example'
+ PROVIDER_VERSION = '0.0.1'
+ BUG_REPORT_LOCATION = 'https://example.com/issues'
+
+ def generate_cache_spec(self, request: PoTokenRequest):
+ # The request is ignored; the spec is constant so tests can assert on exact values
+ return PoTokenCacheSpec(
+ key_bindings={'field': 'example-key'},
+ default_ttl=60,
+ write_policy=CacheProviderWritePolicy.WRITE_FIRST,
+ )
+
+
+class TestPoTokenProvider:
+ """Tests for the PoTokenProvider base class: construction, request validation and helper methods."""
+
+ def test_base_type(self):
+ assert issubclass(PoTokenProvider, IEContentProvider)
+
+ def test_create_provider_missing_fetch_method(self, ie, logger):
+ """A subclass that does not define _real_request_pot cannot be instantiated."""
+ class MissingMethodsPTP(PoTokenProvider):
+ def is_available(self) -> bool:
+ return True
+
+ with pytest.raises(TypeError):
+ MissingMethodsPTP(ie=ie, logger=logger, settings={})
+
+ def test_create_provider_missing_available_method(self, ie, logger):
+ """A subclass that does not define is_available cannot be instantiated."""
+ class MissingMethodsPTP(PoTokenProvider):
+ def _real_request_pot(self, request: PoTokenRequest) -> PoTokenResponse:
+ raise PoTokenProviderRejectedRequest('Not implemented')
+
+ with pytest.raises(TypeError):
+ MissingMethodsPTP(ie=ie, logger=logger, settings={})
+
+ def test_barebones_provider(self, ie, logger):
+ """Check the default metadata of a provider that sets no PROVIDER_* attributes."""
+ class BarebonesProviderPTP(PoTokenProvider):
+ def is_available(self) -> bool:
+ return True
+
+ def _real_request_pot(self, request: PoTokenRequest) -> PoTokenResponse:
+ raise PoTokenProviderRejectedRequest('Not implemented')
+
+ provider = BarebonesProviderPTP(ie=ie, logger=logger, settings={})
+ # Name and key are expected to be the class name without the 'PTP' suffix
+ assert provider.PROVIDER_NAME == 'BarebonesProvider'
+ assert provider.PROVIDER_KEY == 'BarebonesProvider'
+ assert provider.PROVIDER_VERSION == '0.0.0'
+ assert provider.BUG_REPORT_MESSAGE == 'please report this issue to the provider developer at (developer has not provided a bug report location) .'
+
+ def test_example_provider_success(self, ie, logger, pot_request):
+ """ExamplePTP exposes its declared metadata and returns its fixed token for the default request."""
+ provider = ExamplePTP(ie=ie, logger=logger, settings={})
+ assert provider.PROVIDER_NAME == 'example'
+ assert provider.PROVIDER_KEY == 'Example'
+ assert provider.PROVIDER_VERSION == '0.0.1'
+ assert provider.BUG_REPORT_MESSAGE == 'please report this issue to the provider developer at https://example.com/issues .'
+ assert provider.is_available()
+
+ response = provider.request_pot(pot_request)
+
+ assert response.po_token == 'example-token'
+ assert response.expires_at == 123
+
+ def test_provider_unsupported_context(self, ie, logger, pot_request):
+ """A request for a context outside _SUPPORTED_CONTEXTS is rejected."""
+ provider = ExamplePTP(ie=ie, logger=logger, settings={})
+ pot_request.context = PoTokenContext.PLAYER
+
+ with pytest.raises(PoTokenProviderRejectedRequest):
+ provider.request_pot(pot_request)
+
+ def test_provider_unsupported_client(self, ie, logger, pot_request):
+ """A request for a client outside _SUPPORTED_CLIENTS is rejected."""
+ provider = ExamplePTP(ie=ie, logger=logger, settings={})
+ pot_request.innertube_context['client']['clientName'] = 'ANDROID'
+
+ with pytest.raises(PoTokenProviderRejectedRequest):
+ provider.request_pot(pot_request)
+
+ def test_provider_unsupported_proxy_scheme(self, ie, logger, pot_request):
+ """An undeclared proxy scheme is rejected with a message listing the supported ones; a declared scheme is accepted."""
+ provider = ExamplePTP(ie=ie, logger=logger, settings={})
+ pot_request.request_proxy = 'socks4://example.com'
+
+ with pytest.raises(
+ PoTokenProviderRejectedRequest,
+ match='External requests by "example" provider do not support proxy scheme "socks4". Supported proxy '
+ 'schemes: http, socks5h',
+ ):
+ provider.request_pot(pot_request)
+
+ pot_request.request_proxy = 'http://example.com'
+
+ assert provider.request_pot(pot_request)
+
+ def test_provider_ignore_external_request_features(self, ie, logger, pot_request):
+ """With _SUPPORTED_EXTERNAL_REQUEST_FEATURES set to None, a proxy and a source address are both accepted."""
+ class InternalPTP(ExamplePTP):
+ _SUPPORTED_EXTERNAL_REQUEST_FEATURES = None
+
+ provider = InternalPTP(ie=ie, logger=logger, settings={})
+
+ pot_request.request_proxy = 'socks5://example.com'
+ assert provider.request_pot(pot_request)
+ pot_request.request_source_address = '0.0.0.0'
+ assert provider.request_pot(pot_request)
+
+ def test_provider_unsupported_external_request_source_address(self, ie, logger, pot_request):
+ """With an empty feature tuple, setting a source address is rejected while None is accepted."""
+ class InternalPTP(ExamplePTP):
+ _SUPPORTED_EXTERNAL_REQUEST_FEATURES = tuple()
+
+ provider = InternalPTP(ie=ie, logger=logger, settings={})
+
+ pot_request.request_source_address = None
+ assert provider.request_pot(pot_request)
+
+ pot_request.request_source_address = '0.0.0.0'
+ with pytest.raises(
+ PoTokenProviderRejectedRequest,
+ match='External requests by "example" provider do not support setting source address',
+ ):
+ provider.request_pot(pot_request)
+
+ def test_provider_supported_external_request_source_address(self, ie, logger, pot_request):
+ """When SOURCE_ADDRESS is declared, requests with and without a source address are accepted."""
+ class InternalPTP(ExamplePTP):
+ _SUPPORTED_EXTERNAL_REQUEST_FEATURES = (
+ ExternalRequestFeature.SOURCE_ADDRESS,
+ )
+
+ provider = InternalPTP(ie=ie, logger=logger, settings={})
+
+ pot_request.request_source_address = None
+ assert provider.request_pot(pot_request)
+
+ pot_request.request_source_address = '0.0.0.0'
+ assert provider.request_pot(pot_request)
+
+ def test_provider_unsupported_external_request_tls_verification(self, ie, logger, pot_request):
+ """With an empty feature tuple, request_verify_tls=False is rejected while True is accepted."""
+ class InternalPTP(ExamplePTP):
+ _SUPPORTED_EXTERNAL_REQUEST_FEATURES = tuple()
+
+ provider = InternalPTP(ie=ie, logger=logger, settings={})
+
+ pot_request.request_verify_tls = True
+ assert provider.request_pot(pot_request)
+
+ pot_request.request_verify_tls = False
+ with pytest.raises(
+ PoTokenProviderRejectedRequest,
+ match='External requests by "example" provider do not support ignoring TLS certificate failures',
+ ):
+ provider.request_pot(pot_request)
+
+ def test_provider_supported_external_request_tls_verification(self, ie, logger, pot_request):
+ """When DISABLE_TLS_VERIFICATION is declared, both values of request_verify_tls are accepted."""
+ class InternalPTP(ExamplePTP):
+ _SUPPORTED_EXTERNAL_REQUEST_FEATURES = (
+ ExternalRequestFeature.DISABLE_TLS_VERIFICATION,
+ )
+
+ provider = InternalPTP(ie=ie, logger=logger, settings={})
+
+ pot_request.request_verify_tls = True
+ assert provider.request_pot(pot_request)
+
+ pot_request.request_verify_tls = False
+ assert provider.request_pot(pot_request)
+
+ def test_provider_request_webpage(self, ie, logger, pot_request):
+ """_request_webpage copies headers, proxy and cookiejar from pot_request onto the outgoing Request."""
+ provider = ExamplePTP(ie=ie, logger=logger, settings={})
+
+ cookiejar = YoutubeDLCookieJar()
+ pot_request.request_headers = HTTPHeaderDict({'User-Agent': 'example-user-agent'})
+ pot_request.request_proxy = 'socks5://example-proxy.com'
+ pot_request.request_cookiejar = cookiejar
+
+ # Echo the request back so the test can inspect what would have been sent
+ def mock_urlopen(request):
+ return request
+
+ ie._downloader.urlopen = mock_urlopen
+
+ sent_request = provider._request_webpage(Request(
+ 'https://example.com',
+ ), pot_request=pot_request)
+
+ assert sent_request.url == 'https://example.com'
+ assert sent_request.headers['User-Agent'] == 'example-user-agent'
+ assert sent_request.proxies == {'all': 'socks5://example-proxy.com'}
+ assert sent_request.extensions['cookiejar'] is cookiejar
+ assert 'Requesting webpage' in logger.messages['info']
+
+ def test_provider_request_webpage_override(self, ie, logger, pot_request):
+ """Headers, proxies and cookiejar set on the Request itself take precedence over those in pot_request."""
+ provider = ExamplePTP(ie=ie, logger=logger, settings={})
+
+ cookiejar_request = YoutubeDLCookieJar()
+ pot_request.request_headers = HTTPHeaderDict({'User-Agent': 'example-user-agent'})
+ pot_request.request_proxy = 'socks5://example-proxy.com'
+ pot_request.request_cookiejar = cookiejar_request
+
+ # Echo the request back so the test can inspect what would have been sent
+ def mock_urlopen(request):
+ return request
+
+ ie._downloader.urlopen = mock_urlopen
+
+ sent_request = provider._request_webpage(Request(
+ 'https://example.com',
+ headers={'User-Agent': 'override-user-agent-override'},
+ proxies={'http': 'http://example-proxy-override.com'},
+ extensions={'cookiejar': YoutubeDLCookieJar()},
+ ), pot_request=pot_request, note='Custom requesting webpage')
+
+ assert sent_request.url == 'https://example.com'
+ assert sent_request.headers['User-Agent'] == 'override-user-agent-override'
+ assert sent_request.proxies == {'http': 'http://example-proxy-override.com'}
+ assert sent_request.extensions['cookiejar'] is not cookiejar_request
+ assert 'Custom requesting webpage' in logger.messages['info']
+
+ def test_provider_request_webpage_no_log(self, ie, logger, pot_request):
+ """Passing note=False produces no info-level log message."""
+ provider = ExamplePTP(ie=ie, logger=logger, settings={})
+
+ def mock_urlopen(request):
+ return request
+
+ ie._downloader.urlopen = mock_urlopen
+
+ sent_request = provider._request_webpage(Request(
+ 'https://example.com',
+ ), note=False)
+
+ assert sent_request.url == 'https://example.com'
+ assert 'info' not in logger.messages
+
+ def test_provider_request_webpage_no_pot_request(self, ie, logger):
+ """_request_webpage works when pot_request is None."""
+ provider = ExamplePTP(ie=ie, logger=logger, settings={})
+
+ def mock_urlopen(request):
+ return request
+
+ ie._downloader.urlopen = mock_urlopen
+
+ sent_request = provider._request_webpage(Request(
+ 'https://example.com',
+ ), pot_request=None)
+
+ assert sent_request.url == 'https://example.com'
+
+ def test_get_config_arg(self, ie, logger):
+ """_configuration_arg lowercases values unless casesense=True; the key lookup itself is case-sensitive."""
+ provider = ExamplePTP(ie=ie, logger=logger, settings={'abc': ['123D'], 'xyz': ['456a', '789B']})
+
+ assert provider._configuration_arg('abc') == ['123d']
+ assert provider._configuration_arg('abc', default=['default']) == ['123d']
+ # 'ABC' does not match the 'abc' setting, so the default is returned
+ assert provider._configuration_arg('ABC', default=['default']) == ['default']
+ assert provider._configuration_arg('abc', casesense=True) == ['123D']
+ assert provider._configuration_arg('xyz', casesense=False) == ['456a', '789b']
+
+ def test_require_class_end_with_suffix(self, ie, logger):
+ """Reading PROVIDER_KEY on a class whose name lacks the expected suffix raises AssertionError."""
+ class InvalidSuffix(PoTokenProvider):
+ PROVIDER_NAME = 'invalid-suffix'
+
+ def _real_request_pot(self, request: PoTokenRequest) -> PoTokenResponse:
+ raise PoTokenProviderRejectedRequest('Not implemented')
+
+ def is_available(self) -> bool:
+ return True
+
+ # Instantiation succeeds; only the PROVIDER_KEY access is expected to fail
+ provider = InvalidSuffix(ie=ie, logger=logger, settings={})
+
+ with pytest.raises(AssertionError):
+ provider.PROVIDER_KEY # noqa: B018
+
+
+class TestPoTokenCacheProvider:
+ """Tests for the PoTokenCacheProvider base class: required methods, default metadata and config args."""
+
+ def test_base_type(self):
+ assert issubclass(PoTokenCacheProvider, IEContentProvider)
+
+ def test_create_provider_missing_get_method(self, ie, logger):
+ """A subclass that does not define get cannot be instantiated."""
+ class MissingMethodsPCP(PoTokenCacheProvider):
+ def store(self, key: str, value: str, expires_at: int):
+ pass
+
+ def delete(self, key: str):
+ pass
+
+ def is_available(self) -> bool:
+ return True
+
+ with pytest.raises(TypeError):
+ MissingMethodsPCP(ie=ie, logger=logger, settings={})
+
+ def test_create_provider_missing_store_method(self, ie, logger):
+ """A subclass that does not define store cannot be instantiated."""
+ class MissingMethodsPCP(PoTokenCacheProvider):
+ def get(self, key: str):
+ pass
+
+ def delete(self, key: str):
+ pass
+
+ def is_available(self) -> bool:
+ return True
+
+ with pytest.raises(TypeError):
+ MissingMethodsPCP(ie=ie, logger=logger, settings={})
+
+ def test_create_provider_missing_delete_method(self, ie, logger):
+ """A subclass that does not define delete cannot be instantiated."""
+ class MissingMethodsPCP(PoTokenCacheProvider):
+ def get(self, key: str):
+ pass
+
+ def store(self, key: str, value: str, expires_at: int):
+ pass
+
+ def is_available(self) -> bool:
+ return True
+
+ with pytest.raises(TypeError):
+ MissingMethodsPCP(ie=ie, logger=logger, settings={})
+
+ def test_create_provider_missing_is_available_method(self, ie, logger):
+ """A subclass that does not define is_available cannot be instantiated."""
+ class MissingMethodsPCP(PoTokenCacheProvider):
+ def get(self, key: str):
+ pass
+
+ def store(self, key: str, value: str, expires_at: int):
+ pass
+
+ def delete(self, key: str):
+ pass
+
+ with pytest.raises(TypeError):
+ MissingMethodsPCP(ie=ie, logger=logger, settings={})
+
+ def test_barebones_provider(self, ie, logger):
+ """Check the default metadata of a cache provider that sets no PROVIDER_* attributes."""
+ class BarebonesProviderPCP(PoTokenCacheProvider):
+
+ def is_available(self) -> bool:
+ return True
+
+ def get(self, key: str):
+ return 'example-cache'
+
+ def store(self, key: str, value: str, expires_at: int):
+ pass
+
+ def delete(self, key: str):
+ pass
+
+ provider = BarebonesProviderPCP(ie=ie, logger=logger, settings={})
+ # Name and key are expected to be the class name without the 'PCP' suffix
+ assert provider.PROVIDER_NAME == 'BarebonesProvider'
+ assert provider.PROVIDER_KEY == 'BarebonesProvider'
+ assert provider.PROVIDER_VERSION == '0.0.0'
+ assert provider.BUG_REPORT_MESSAGE == 'please report this issue to the provider developer at (developer has not provided a bug report location) .'
+
+ def test_create_provider_example(self, ie, logger):
+ """ExampleCacheProviderPCP exposes its declared metadata and reports itself available."""
+ provider = ExampleCacheProviderPCP(ie=ie, logger=logger, settings={})
+ assert provider.PROVIDER_NAME == 'example'
+ assert provider.PROVIDER_KEY == 'ExampleCacheProvider'
+ assert provider.PROVIDER_VERSION == '0.0.1'
+ assert provider.BUG_REPORT_MESSAGE == 'please report this issue to the provider developer at https://example.com/issues .'
+ assert provider.is_available()
+
+ def test_get_config_arg(self, ie, logger):
+ """_configuration_arg lowercases values unless casesense=True; the key lookup itself is case-sensitive."""
+ provider = ExampleCacheProviderPCP(ie=ie, logger=logger, settings={'abc': ['123D'], 'xyz': ['456a', '789B']})
+ assert provider._configuration_arg('abc') == ['123d']
+ assert provider._configuration_arg('abc', default=['default']) == ['123d']
+ # 'ABC' does not match the 'abc' setting, so the default is returned
+ assert provider._configuration_arg('ABC', default=['default']) == ['default']
+ assert provider._configuration_arg('abc', casesense=True) == ['123D']
+ assert provider._configuration_arg('xyz', casesense=False) == ['456a', '789b']
+
+ def test_require_class_end_with_suffix(self, ie, logger):
+ """Reading PROVIDER_KEY on a class whose name lacks the expected suffix raises AssertionError."""
+ class InvalidSuffix(PoTokenCacheProvider):
+ def get(self, key: str):
+ return 'example-cache'
+
+ def store(self, key: str, value: str, expires_at: int):
+ pass
+
+ def delete(self, key: str):
+ pass
+
+ def is_available(self) -> bool:
+ return True
+
+ # Instantiation succeeds; only the PROVIDER_KEY access is expected to fail
+ provider = InvalidSuffix(ie=ie, logger=logger, settings={})
+
+ with pytest.raises(AssertionError):
+ provider.PROVIDER_KEY # noqa: B018
+
+
+class TestPoTokenCacheSpecProvider:
+ """Tests for the PoTokenCacheSpecProvider base class: required methods, default metadata and config args."""
+
+ def test_base_type(self):
+ assert issubclass(PoTokenCacheSpecProvider, IEContentProvider)
+
+ def test_create_provider_missing_supports_method(self, ie, logger):
+ """A subclass that defines no methods cannot be instantiated."""
+ # NOTE(review): the test name mentions a "supports" method, but the other subclasses in this
+ # file only need generate_cache_spec to be instantiable - the name looks stale; confirm
+ class MissingMethodsPCS(PoTokenCacheSpecProvider):
+ pass
+
+ with pytest.raises(TypeError):
+ MissingMethodsPCS(ie=ie, logger=logger, settings={})
+
+ def test_create_provider_barebones(self, ie, pot_request, logger):
+ """Check the default metadata, availability and write policy of a spec provider that only defines generate_cache_spec."""
+ class BarebonesProviderPCSP(PoTokenCacheSpecProvider):
+ def generate_cache_spec(self, request: PoTokenRequest):
+ return PoTokenCacheSpec(
+ default_ttl=100,
+ key_bindings={},
+ )
+
+ provider = BarebonesProviderPCSP(ie=ie, logger=logger, settings={})
+ # Name and key are expected to be the class name without the 'PCSP' suffix
+ assert provider.PROVIDER_NAME == 'BarebonesProvider'
+ assert provider.PROVIDER_KEY == 'BarebonesProvider'
+ assert provider.PROVIDER_VERSION == '0.0.0'
+ assert provider.BUG_REPORT_MESSAGE == 'please report this issue to the provider developer at (developer has not provided a bug report location) .'
+ # is_available is not overridden above, so this checks the inherited implementation
+ assert provider.is_available()
+ assert provider.generate_cache_spec(request=pot_request).default_ttl == 100
+ assert provider.generate_cache_spec(request=pot_request).key_bindings == {}
+ # write_policy was not passed to PoTokenCacheSpec, so this checks its default
+ assert provider.generate_cache_spec(request=pot_request).write_policy == CacheProviderWritePolicy.WRITE_ALL
+
+ def test_create_provider_example(self, ie, pot_request, logger):
+ """ExampleCacheSpecProviderPCSP exposes its declared metadata and returns its fixed spec."""
+ provider = ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={})
+ assert provider.PROVIDER_NAME == 'example'
+ assert provider.PROVIDER_KEY == 'ExampleCacheSpecProvider'
+ assert provider.PROVIDER_VERSION == '0.0.1'
+ assert provider.BUG_REPORT_MESSAGE == 'please report this issue to the provider developer at https://example.com/issues .'
+ assert provider.is_available()
+ assert provider.generate_cache_spec(pot_request)
+ assert provider.generate_cache_spec(pot_request).key_bindings == {'field': 'example-key'}
+ assert provider.generate_cache_spec(pot_request).default_ttl == 60
+ assert provider.generate_cache_spec(pot_request).write_policy == CacheProviderWritePolicy.WRITE_FIRST
+
+ def test_get_config_arg(self, ie, logger):
+ """_configuration_arg lowercases values unless casesense=True; the key lookup itself is case-sensitive."""
+ provider = ExampleCacheSpecProviderPCSP(ie=ie, logger=logger, settings={'abc': ['123D'], 'xyz': ['456a', '789B']})
+
+ assert provider._configuration_arg('abc') == ['123d']
+ assert provider._configuration_arg('abc', default=['default']) == ['123d']
+ # 'ABC' does not match the 'abc' setting, so the default is returned
+ assert provider._configuration_arg('ABC', default=['default']) == ['default']
+ assert provider._configuration_arg('abc', casesense=True) == ['123D']
+ assert provider._configuration_arg('xyz', casesense=False) == ['456a', '789b']
+
+ def test_require_class_end_with_suffix(self, ie, logger):
+ """Reading PROVIDER_KEY on a class whose name lacks the expected suffix raises AssertionError."""
+ class InvalidSuffix(PoTokenCacheSpecProvider):
+ def generate_cache_spec(self, request: PoTokenRequest):
+ return None
+
+ # Instantiation succeeds; only the PROVIDER_KEY access is expected to fail
+ provider = InvalidSuffix(ie=ie, logger=logger, settings={})
+
+ with pytest.raises(AssertionError):
+ provider.PROVIDER_KEY # noqa: B018
+
+
+class TestPoTokenRequest:
+ """Tests for PoTokenRequest itself."""
+
+ def test_copy_request(self, pot_request):
+ """copy() returns an equal request whose mutable fields are independent, except the cookiejar which is shared."""
+ copied_request = pot_request.copy()
+
+ assert copied_request is not pot_request
+ assert copied_request.context == pot_request.context
+ assert copied_request.innertube_context == pot_request.innertube_context
+ assert copied_request.innertube_context is not pot_request.innertube_context
+ # Mutating a nested dict of the copy must not affect the original
+ copied_request.innertube_context['client']['clientName'] = 'ANDROID'
+ assert pot_request.innertube_context['client']['clientName'] != 'ANDROID'
+ assert copied_request.innertube_host == pot_request.innertube_host
+ assert copied_request.session_index == pot_request.session_index
+ assert copied_request.player_url == pot_request.player_url
+ assert copied_request.is_authenticated == pot_request.is_authenticated
+ assert copied_request.visitor_data == pot_request.visitor_data
+ assert copied_request.data_sync_id == pot_request.data_sync_id
+ assert copied_request.video_id == pot_request.video_id
+ # The cookiejar is expected to be the very same object in both requests
+ assert copied_request.request_cookiejar is pot_request.request_cookiejar
+ assert copied_request.request_proxy == pot_request.request_proxy
+ # Headers are expected to be equal but held in a separate object
+ assert copied_request.request_headers == pot_request.request_headers
+ assert copied_request.request_headers is not pot_request.request_headers
+ assert copied_request.request_timeout == pot_request.request_timeout
+ assert copied_request.request_source_address == pot_request.request_source_address
+ assert copied_request.request_verify_tls == pot_request.request_verify_tls
+ assert copied_request.bypass_cache == pot_request.bypass_cache
+
+
+def test_provider_bug_report_message(ie, logger):
+ """provider_bug_report_message prefixes '; ' by default, or the `before` text followed by a capitalized message."""
+ provider = ExamplePTP(ie=ie, logger=logger, settings={})
+ assert provider.BUG_REPORT_MESSAGE == 'please report this issue to the provider developer at https://example.com/issues .'
+
+ message = provider_bug_report_message(provider)
+ assert message == '; please report this issue to the provider developer at https://example.com/issues .'
+
+ # With `before`, the message starts with that text and 'please' becomes 'Please'
+ message_before = provider_bug_report_message(provider, before='custom message!')
+ assert message_before == 'custom message! Please report this issue to the provider developer at https://example.com/issues .'
+
+
+def test_register_provider(ie):
+    """@register_provider stores the class in _pot_providers under its PROVIDER_KEY."""
+
+    @register_provider
+    class UnavailableProviderPTP(PoTokenProvider):
+        def is_available(self) -> bool:
+            return False
+
+        def _real_request_pot(self, request: PoTokenRequest) -> PoTokenResponse:
+            raise PoTokenProviderRejectedRequest('Not implemented')
+
+    try:
+        assert _pot_providers.value.get('UnavailableProvider') == UnavailableProviderPTP
+    finally:
+        # Always unregister, so a failing assertion cannot leak this class into the
+        # global registry seen by later tests
+        _pot_providers.value.pop('UnavailableProvider', None)
+
+
+def test_register_pot_preference(ie):
+    """@register_preference adds exactly one entry to _ptp_preferences."""
+    registered_before = list(_ptp_preferences.value)
+
+    @register_preference(ExamplePTP)
+    def unavailable_preference(provider: PoTokenProvider, request: PoTokenRequest):
+        return 1
+
+    try:
+        assert len(_ptp_preferences.value) == len(registered_before) + 1
+    finally:
+        # Undo the registration so it does not leak into later tests. The decorator may
+        # register a wrapper rather than the function itself, so the new entries are
+        # found by comparing against the snapshot taken above.
+        # NOTE(review): assumes the registry container supports .remove() (set or list) - confirm
+        for preference in list(_ptp_preferences.value):
+            if preference not in registered_before:
+                _ptp_preferences.value.remove(preference)
+
+
+def test_register_cache_provider(ie):
+    """@cache.register_provider stores the class in _pot_cache_providers under its PROVIDER_KEY."""
+
+    @cache.register_provider
+    class UnavailableCacheProviderPCP(PoTokenCacheProvider):
+        def is_available(self) -> bool:
+            return False
+
+        def get(self, key: str):
+            return 'example-cache'
+
+        def store(self, key: str, value: str, expires_at: int):
+            pass
+
+        def delete(self, key: str):
+            pass
+
+    try:
+        assert _pot_cache_providers.value.get('UnavailableCacheProvider') == UnavailableCacheProviderPCP
+    finally:
+        # Always unregister, so a failing assertion cannot leak this class into the
+        # global registry seen by later tests
+        _pot_cache_providers.value.pop('UnavailableCacheProvider', None)
+
+
+def test_register_cache_provider_spec(ie):
+    """@cache.register_spec stores the class in _pot_pcs_providers under its PROVIDER_KEY."""
+
+    @cache.register_spec
+    class UnavailableCacheProviderPCSP(PoTokenCacheSpecProvider):
+        def is_available(self) -> bool:
+            return False
+
+        def generate_cache_spec(self, request: PoTokenRequest):
+            return None
+
+    try:
+        assert _pot_pcs_providers.value.get('UnavailableCacheProvider') == UnavailableCacheProviderPCSP
+    finally:
+        # Always unregister, so a failing assertion cannot leak this class into the
+        # global registry seen by later tests
+        _pot_pcs_providers.value.pop('UnavailableCacheProvider', None)
+
+
+def test_register_cache_provider_preference(ie):
+    """@cache.register_preference adds exactly one entry to _pot_cache_provider_preferences."""
+    registered_before = list(_pot_cache_provider_preferences.value)
+
+    @cache.register_preference(ExampleCacheProviderPCP)
+    def unavailable_preference(provider: PoTokenCacheProvider, request: PoTokenRequest):
+        return 1
+
+    try:
+        assert len(_pot_cache_provider_preferences.value) == len(registered_before) + 1
+    finally:
+        # Undo the registration so it does not leak into later tests. The decorator may
+        # register a wrapper rather than the function itself, so the new entries are
+        # found by comparing against the snapshot taken above.
+        # NOTE(review): assumes the registry container supports .remove() (set or list) - confirm
+        for preference in list(_pot_cache_provider_preferences.value):
+            if preference not in registered_before:
+                _pot_cache_provider_preferences.value.remove(preference)
+
+
+def test_logger_log_level(logger):
+ """LogLevel accepts names in any letter case and numeric values, and maps an unknown name to INFO."""
+ assert logger.LogLevel('INFO') == logger.LogLevel.INFO
+ assert logger.LogLevel('debuG') == logger.LogLevel.DEBUG
+ assert logger.LogLevel(10) == logger.LogLevel.DEBUG
+ # An unrecognized name is expected to fall back to INFO rather than raise
+ assert logger.LogLevel('UNKNOWN') == logger.LogLevel.INFO
diff --git a/test/test_youtube_signature.py b/test/test_youtube_signature.py
index 0f0885366..3336b6bff 100644
--- a/test/test_youtube_signature.py
+++ b/test/test_youtube_signature.py
@@ -316,6 +316,18 @@
'https://www.youtube.com/s/player/8a8ac953/tv-player-es6.vflset/tv-player-es6.js',
'MiBYeXx_vRREbiCCmh', 'RtZYMVvmkE0JE',
),
+ (
+ 'https://www.youtube.com/s/player/59b252b9/player_ias.vflset/en_US/base.js',
+ 'D3XWVpYgwhLLKNK4AGX', 'aZrQ1qWJ5yv5h',
+ ),
+ (
+ 'https://www.youtube.com/s/player/fc2a56a5/player_ias.vflset/en_US/base.js',
+ 'qTKWg_Il804jd2kAC', 'OtUAm2W6gyzJjB9u',
+ ),
+ (
+ 'https://www.youtube.com/s/player/fc2a56a5/tv-player-ias.vflset/tv-player-ias.js',
+ 'qTKWg_Il804jd2kAC', 'OtUAm2W6gyzJjB9u',
+ ),
]
diff --git a/test/testdata/thumbnails/foo %d bar/foo_%d.webp b/test/testdata/thumbnails/foo %d bar/foo_%d.webp
deleted file mode 100644
index d64d0839f..000000000
Binary files a/test/testdata/thumbnails/foo %d bar/foo_%d.webp and /dev/null differ
diff --git a/test/testdata/thumbnails/foo %d bar/placeholder b/test/testdata/thumbnails/foo %d bar/placeholder
new file mode 100644
index 000000000..e69de29bb
diff --git a/yt_dlp/YoutubeDL.py b/yt_dlp/YoutubeDL.py
index 7021c2d89..7c4ff8f33 100644
--- a/yt_dlp/YoutubeDL.py
+++ b/yt_dlp/YoutubeDL.py
@@ -491,7 +491,7 @@ class YoutubeDL:
The template is mapped on a dictionary with keys 'progress' and 'info'
retry_sleep_functions: Dictionary of functions that takes the number of attempts
as argument and returns the time to sleep in seconds.
- Allowed keys are 'http', 'fragment', 'file_access'
+ Allowed keys are 'http', 'fragment', 'file_access', 'extractor'
download_ranges: A callback function that gets called for every video with
the signature (info_dict, ydl) -> Iterable[Section].
Only the returned sections will be downloaded.
@@ -641,6 +641,7 @@ def __init__(self, params=None, auto_init=True):
self._printed_messages = set()
self._first_webpage_request = True
self._post_hooks = []
+ self._close_hooks = []
self._progress_hooks = []
self._postprocessor_hooks = []
self._download_retcode = 0
@@ -909,6 +910,11 @@ def add_post_hook(self, ph):
"""Add the post hook"""
self._post_hooks.append(ph)
+ def add_close_hook(self, ch):
+ """Add a close hook, called when YoutubeDL.close() is called
+
+ @param ch A callable; close() invokes each registered hook with no arguments,
+ in the order the hooks were added
+ """
+ assert callable(ch), 'Close hook must be callable'
+ self._close_hooks.append(ch)
+
def add_progress_hook(self, ph):
"""Add the download progress hook"""
self._progress_hooks.append(ph)
@@ -1017,6 +1023,9 @@ def close(self):
self._request_director.close()
del self._request_director
+ for close_hook in self._close_hooks:
+ close_hook()
+
def trouble(self, message=None, tb=None, is_error=True):
"""Determine action to take when a download problem appears.
diff --git a/yt_dlp/cookies.py b/yt_dlp/cookies.py
index fad323c90..5675445ac 100644
--- a/yt_dlp/cookies.py
+++ b/yt_dlp/cookies.py
@@ -764,11 +764,11 @@ def _get_linux_desktop_environment(env, logger):
GetDesktopEnvironment
"""
xdg_current_desktop = env.get('XDG_CURRENT_DESKTOP', None)
- desktop_session = env.get('DESKTOP_SESSION', None)
+ desktop_session = env.get('DESKTOP_SESSION', '')
if xdg_current_desktop is not None:
for part in map(str.strip, xdg_current_desktop.split(':')):
if part == 'Unity':
- if desktop_session is not None and 'gnome-fallback' in desktop_session:
+ if 'gnome-fallback' in desktop_session:
return _LinuxDesktopEnvironment.GNOME
else:
return _LinuxDesktopEnvironment.UNITY
@@ -797,35 +797,34 @@ def _get_linux_desktop_environment(env, logger):
return _LinuxDesktopEnvironment.UKUI
elif part == 'LXQt':
return _LinuxDesktopEnvironment.LXQT
- logger.info(f'XDG_CURRENT_DESKTOP is set to an unknown value: "{xdg_current_desktop}"')
+ logger.debug(f'XDG_CURRENT_DESKTOP is set to an unknown value: "{xdg_current_desktop}"')
- elif desktop_session is not None:
- if desktop_session == 'deepin':
- return _LinuxDesktopEnvironment.DEEPIN
- elif desktop_session in ('mate', 'gnome'):
- return _LinuxDesktopEnvironment.GNOME
- elif desktop_session in ('kde4', 'kde-plasma'):
+ if desktop_session == 'deepin':
+ return _LinuxDesktopEnvironment.DEEPIN
+ elif desktop_session in ('mate', 'gnome'):
+ return _LinuxDesktopEnvironment.GNOME
+ elif desktop_session in ('kde4', 'kde-plasma'):
+ return _LinuxDesktopEnvironment.KDE4
+ elif desktop_session == 'kde':
+ if 'KDE_SESSION_VERSION' in env:
return _LinuxDesktopEnvironment.KDE4
- elif desktop_session == 'kde':
- if 'KDE_SESSION_VERSION' in env:
- return _LinuxDesktopEnvironment.KDE4
- else:
- return _LinuxDesktopEnvironment.KDE3
- elif 'xfce' in desktop_session or desktop_session == 'xubuntu':
- return _LinuxDesktopEnvironment.XFCE
- elif desktop_session == 'ukui':
- return _LinuxDesktopEnvironment.UKUI
else:
- logger.info(f'DESKTOP_SESSION is set to an unknown value: "{desktop_session}"')
-
+ return _LinuxDesktopEnvironment.KDE3
+ elif 'xfce' in desktop_session or desktop_session == 'xubuntu':
+ return _LinuxDesktopEnvironment.XFCE
+ elif desktop_session == 'ukui':
+ return _LinuxDesktopEnvironment.UKUI
else:
- if 'GNOME_DESKTOP_SESSION_ID' in env:
- return _LinuxDesktopEnvironment.GNOME
- elif 'KDE_FULL_SESSION' in env:
- if 'KDE_SESSION_VERSION' in env:
- return _LinuxDesktopEnvironment.KDE4
- else:
- return _LinuxDesktopEnvironment.KDE3
+ logger.debug(f'DESKTOP_SESSION is set to an unknown value: "{desktop_session}"')
+
+ if 'GNOME_DESKTOP_SESSION_ID' in env:
+ return _LinuxDesktopEnvironment.GNOME
+ elif 'KDE_FULL_SESSION' in env:
+ if 'KDE_SESSION_VERSION' in env:
+ return _LinuxDesktopEnvironment.KDE4
+ else:
+ return _LinuxDesktopEnvironment.KDE3
+
return _LinuxDesktopEnvironment.OTHER
diff --git a/yt_dlp/extractor/_extractors.py b/yt_dlp/extractor/_extractors.py
index e7dcb9853..34c98b537 100644
--- a/yt_dlp/extractor/_extractors.py
+++ b/yt_dlp/extractor/_extractors.py
@@ -300,7 +300,6 @@
BrainPOPIlIE,
BrainPOPJrIE,
)
-from .bravotv import BravoTVIE
from .breitbart import BreitBartIE
from .brightcove import (
BrightcoveLegacyIE,
@@ -1262,6 +1261,7 @@
)
from .nbc import (
NBCIE,
+ BravoTVIE,
NBCNewsIE,
NBCOlympicsIE,
NBCOlympicsStreamIE,
@@ -1269,6 +1269,7 @@
NBCSportsStreamIE,
NBCSportsVPlayerIE,
NBCStationsIE,
+ SyfyIE,
)
from .ndr import (
NDRIE,
@@ -2016,13 +2017,11 @@
SverigesRadioPublicationIE,
)
from .svt import (
- SVTIE,
SVTPageIE,
SVTPlayIE,
SVTSeriesIE,
)
from .swearnet import SwearnetEpisodeIE
-from .syfy import SyfyIE
from .syvdk import SYVDKIE
from .sztvhu import SztvHuIE
from .tagesschau import TagesschauIE
@@ -2147,6 +2146,7 @@
from .toggo import ToggoIE
from .tonline import TOnlineIE
from .toongoggles import ToonGogglesIE
+from .toutiao import ToutiaoIE
from .toutv import TouTvIE
from .toypics import (
ToypicsIE,
@@ -2369,6 +2369,7 @@
VHXEmbedIE,
VimeoAlbumIE,
VimeoChannelIE,
+ VimeoEventIE,
VimeoGroupsIE,
VimeoIE,
VimeoLikesIE,
diff --git a/yt_dlp/extractor/adobepass.py b/yt_dlp/extractor/adobepass.py
index f1b877927..8c2d9d934 100644
--- a/yt_dlp/extractor/adobepass.py
+++ b/yt_dlp/extractor/adobepass.py
@@ -3,6 +3,7 @@
import re
import time
import urllib.parse
+import uuid
import xml.etree.ElementTree as etree
from .common import InfoExtractor
@@ -10,6 +11,7 @@
from ..utils import (
NO_DEFAULT,
ExtractorError,
+ parse_qs,
unescapeHTML,
unified_timestamp,
urlencode_postdata,
@@ -45,6 +47,8 @@
'name': 'Comcast XFINITY',
'username_field': 'user',
'password_field': 'passwd',
+ 'login_hostname': 'login.xfinity.com',
+ 'needs_newer_ua': True,
},
'TWC': {
'name': 'Time Warner Cable | Spectrum',
@@ -74,6 +78,12 @@
'name': 'Verizon FiOS',
'username_field': 'IDToken1',
'password_field': 'IDToken2',
+ 'login_hostname': 'ssoauth.verizon.com',
+ },
+ 'Fubo': {
+ 'name': 'Fubo',
+ 'username_field': 'username',
+ 'password_field': 'password',
},
'Cablevision': {
'name': 'Optimum/Cablevision',
@@ -1338,6 +1348,7 @@
'name': 'Sling TV',
'username_field': 'username',
'password_field': 'password',
+ 'login_hostname': 'identity.sling.com',
},
'Suddenlink': {
'name': 'Suddenlink',
@@ -1355,7 +1366,6 @@
class AdobePassIE(InfoExtractor): # XXX: Conventionally, base classes should end with BaseIE/InfoExtractor
_SERVICE_PROVIDER_TEMPLATE = 'https://sp.auth.adobe.com/adobe-services/%s'
_USER_AGENT = 'Mozilla/5.0 (X11; Linux i686; rv:47.0) Gecko/20100101 Firefox/47.0'
- _MODERN_USER_AGENT = 'Mozilla/5.0 (Windows NT 10.0; rv:131.0) Gecko/20100101 Firefox/131.0'
_MVPD_CACHE = 'ap-mvpd'
_DOWNLOADING_LOGIN_PAGE = 'Downloading Provider Login Page'
@@ -1367,6 +1377,14 @@ def _download_webpage_handle(self, *args, **kwargs):
return super()._download_webpage_handle(
*args, **kwargs)
+ @staticmethod
+ def _get_mso_headers(mso_info):
+ """Return extra request headers for an MSO: a newer Firefox User-Agent if its 'needs_newer_ua' entry is truthy, else an empty dict"""
+ # yt-dlp's default user-agent is usually too old for some MSOs like Comcast_SSO
+ # See: https://github.com/yt-dlp/yt-dlp/issues/10848
+ return {
+ 'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; rv:131.0) Gecko/20100101 Firefox/131.0',
+ } if mso_info.get('needs_newer_ua') else {}
+
@staticmethod
def _get_mvpd_resource(provider_id, title, guid, rating):
channel = etree.Element('channel')
@@ -1382,7 +1400,13 @@ def _get_mvpd_resource(provider_id, title, guid, rating):
resource_rating.text = rating
return '