From cf25e8d345e5cf2a33eac6cd17fdad31f5d9f93c Mon Sep 17 00:00:00 2001 From: Ben Rog-Wilhelm Date: Sun, 12 May 2019 20:53:07 -0700 Subject: [PATCH 1/3] Add Kaltura support for an uncommon typo in a GDC Vault page --- youtube_dl/extractor/kaltura.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/youtube_dl/extractor/kaltura.py b/youtube_dl/extractor/kaltura.py index 639d73837..48204492b 100644 --- a/youtube_dl/extractor/kaltura.py +++ b/youtube_dl/extractor/kaltura.py @@ -135,7 +135,7 @@ class KalturaIE(InfoExtractor): ''', webpage) or re.search( r'''(?xs) - <(?:iframe[^>]+src|meta[^>]+\bcontent)=(?P<q1>["']) + <(?:iframe[^>]+src|meta[^>]+\bcontent)=(?P<q1>["'])[ ]? (?:https?:)?//(?:(?:www|cdnapi(?:sec)?)\.)?kaltura\.com/(?:(?!(?P=q1)).)*\b(?:p|partner_id)/(?P<partner_id>\d+) (?:(?!(?P=q1)).)* [?&;]entry_id=(?P<id>(?:(?!(?P=q1))[^&])+) From b6436bb03b419a855494d997d97040a6747cc453 Mon Sep 17 00:00:00 2001 From: Ben Rog-Wilhelm Date: Mon, 13 May 2019 00:15:12 -0700 Subject: [PATCH 2/3] Extend Kaltura whitespace stripping to unlimited amounts of all whitespace --- youtube_dl/extractor/kaltura.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/youtube_dl/extractor/kaltura.py b/youtube_dl/extractor/kaltura.py index 48204492b..8ee231969 100644 --- a/youtube_dl/extractor/kaltura.py +++ b/youtube_dl/extractor/kaltura.py @@ -135,7 +135,7 @@ class KalturaIE(InfoExtractor): ''', webpage) or re.search( r'''(?xs) - <(?:iframe[^>]+src|meta[^>]+\bcontent)=(?P<q1>["'])[ ]? 
+ <(?:iframe[^>]+src|meta[^>]+\bcontent)=(?P<q1>["'])\s* (?:https?:)?//(?:(?:www|cdnapi(?:sec)?)\.)?kaltura\.com/(?:(?!(?P=q1)).)*\b(?:p|partner_id)/(?P<partner_id>\d+) (?:(?!(?P=q1)).)* [?&;]entry_id=(?P<id>(?:(?!(?P=q1))[^&])+) From 9294cc5a8c3e04c7a94f2f15e76cbf4242ac7d89 Mon Sep 17 00:00:00 2001 From: Ben Rog-Wilhelm Date: Mon, 13 May 2019 00:46:56 -0700 Subject: [PATCH 3/3] Add test --- youtube_dl/extractor/kaltura.py | 16 +++++++++++++++- 1 file changed, 15 insertions(+), 1 deletion(-) diff --git a/youtube_dl/extractor/kaltura.py b/youtube_dl/extractor/kaltura.py index 8ee231969..0317852ee 100644 --- a/youtube_dl/extractor/kaltura.py +++ b/youtube_dl/extractor/kaltura.py @@ -103,7 +103,21 @@ class KalturaIE(InfoExtractor): { 'url': 'https://www.kaltura.com:443/index.php/extwidget/preview/partner_id/1770401/uiconf_id/37307382/entry_id/0_58u8kme7/embed/iframe?&flashvars[streamerType]=auto', 'only_matching': True, - } + }, + { + 'url': 'https://www.gdcvault.com/play/1025699', + 'info_dict': { + 'id': '0_zagynv0a', + 'ext': 'mp4', + 'title': 'Tech Toolbox', + 'upload_date': '20190408', + 'uploader_id': 'joe@blazestreaming.com', + 'timestamp': 1554764629, + }, + 'params': { + 'skip_download': True, + }, + }, ] @staticmethod