1
0
mirror of https://github.com/yt-dlp/yt-dlp.git synced 2025-10-24 03:08:34 +00:00

[kaltura] Improve widget ID extraction (closes #11480)

This commit is contained in:
Yen Chi Hsuan 2016-12-20 18:45:52 +08:00
parent c80db5d398
commit 8ab7e6c4cc
No known key found for this signature in database
GPG Key ID: 7F902A182457CA23
3 changed files with 24 additions and 1 deletions

View File

@ -1,3 +1,9 @@
version <unreleased>
Extractors
* [kaltura] Fix wrong widget ID in some cases (#11480)
version 2016.12.18 version 2016.12.18
Core Core

View File

@ -972,6 +972,20 @@ class GenericIE(InfoExtractor):
'skip_download': True, 'skip_download': True,
} }
}, },
{
# Kaltura embedded, some fileExt broken (#11480)
'url': 'http://www.cornell.edu/video/nima-arkani-hamed-standard-models-of-particle-physics',
'info_dict': {
'id': '1_sgtvehim',
'ext': 'mp4',
'title': 'Our "Standard Models" of particle physics and cosmology',
'description': 'md5:67ea74807b8c4fea92a6f38d6d323861',
'timestamp': 1321158993,
'upload_date': '20111113',
'uploader_id': 'kps1',
},
'add_ie': ['Kaltura'],
},
# Eagle.Platform embed (generic URL) # Eagle.Platform embed (generic URL)
{ {
'url': 'http://lenta.ru/news/2015/03/06/navalny/', 'url': 'http://lenta.ru/news/2015/03/06/navalny/',

View File

@ -107,7 +107,7 @@ def _extract_url(webpage):
(?P<q1>['\"])wid(?P=q1)\s*:\s* (?P<q1>['\"])wid(?P=q1)\s*:\s*
(?P<q2>['\"])_?(?P<partner_id>(?:(?!(?P=q2)).)+)(?P=q2),.*? (?P<q2>['\"])_?(?P<partner_id>(?:(?!(?P=q2)).)+)(?P=q2),.*?
(?P<q3>['\"])entry_?[Ii]d(?P=q3)\s*:\s* (?P<q3>['\"])entry_?[Ii]d(?P=q3)\s*:\s*
(?P<q4>['\"])(?P<id>(?:(?!(?P=q4)).)+)(?P=q4), (?P<q4>['\"])(?P<id>(?:(?!(?P=q4)).)+)(?P=q4)(?:,|\s*\})
""", webpage) or """, webpage) or
re.search( re.search(
r'''(?xs) r'''(?xs)
@ -266,6 +266,9 @@ def sign_url(unsigned_url):
# skip for now. # skip for now.
if f.get('fileExt') == 'chun': if f.get('fileExt') == 'chun':
continue continue
if not f.get('fileExt') and f.get('containerFormat') == 'qt':
# QT indicates QuickTime; some videos have broken fileExt
f['fileExt'] = 'mov'
video_url = sign_url( video_url = sign_url(
'%s/flavorId/%s' % (data_url, f['id'])) '%s/flavorId/%s' % (data_url, f['id']))
# audio-only has no videoCodecId (e.g. kaltura:1926081:0_c03e1b5g # audio-only has no videoCodecId (e.g. kaltura:1926081:0_c03e1b5g