From d6b9e85f5c19c78bd2ef8fbf72dff9ee98e90c03 Mon Sep 17 00:00:00 2001
From: freibadschwimmer
Date: Fri, 9 Nov 2018 14:50:45 +0200
Subject: [PATCH] [servushockeynight.com] Add new extractor

---
 youtube_dl/extractor/extractors.py        |  1 +
 youtube_dl/extractor/servushockeynight.py | 41 +++++++++++++++++++++++
 2 files changed, 42 insertions(+)
 create mode 100644 youtube_dl/extractor/servushockeynight.py

diff --git a/youtube_dl/extractor/extractors.py b/youtube_dl/extractor/extractors.py
index e5488cce4..71e0163f4 100644
--- a/youtube_dl/extractor/extractors.py
+++ b/youtube_dl/extractor/extractors.py
@@ -983,6 +983,7 @@ from .senateisvp import SenateISVPIE
 from .sendtonews import SendtoNewsIE
 from .servingsys import ServingSysIE
 from .servus import ServusIE
+from .servushockeynight import servushockeynightIE
 from .sevenplus import SevenPlusIE
 from .sexu import SexuIE
 from .seznamzpravy import (
diff --git a/youtube_dl/extractor/servushockeynight.py b/youtube_dl/extractor/servushockeynight.py
new file mode 100644
index 000000000..b4f2c564a
--- /dev/null
+++ b/youtube_dl/extractor/servushockeynight.py
@@ -0,0 +1,41 @@
+# coding: utf-8
+from __future__ import unicode_literals
+
+from .common import InfoExtractor
+
+
+class servushockeynightIE(InfoExtractor):
+    """Extract page metadata for videos hosted on servushockeynight.com."""
+
+    # The id group takes one path segment, optionally below /videos/, so the
+    # URL in _TEST is matched as well as plain numeric paths.
+    _VALID_URL = r'https?://(?:www\.)?servushockeynight\.com/(?:videos/)?(?P<id>[^/?#]+)'
+    _TEST = {
+        'url': 'http://servushockeynight.com/videos/runde-17-graz-vs-kac-das-ganze-spiel-zum-nachsehen/',
+        'md5': '7ff5e10e45e08062fb94270b88a39948',
+        'info_dict': {
+            'id': '5857499729001',
+            'ext': 'mp4',
+            'title': 'Runde 17: Graz vs. Klagenfurt // Saison 18/19 - Ganzes Spiel',
+            'timestamp': 1541359757,
+            'uploader_id': '3213846503001',
+            'upload_date': '20181104',
+        }
+    }
+
+    def _real_extract(self, url):
+        video_id = self._match_id(url)
+        webpage = self._download_webpage(url, video_id)
+
+        title = self._html_search_regex(r'<h1>(.+?)</h1>', webpage, 'title')
+
+        # NOTE(review): no 'url' or 'formats' entry is returned here, so the
+        # id/ext/timestamp/uploader_id values expected by _TEST are not
+        # produced yet -- TODO confirm how the page embeds its player.
+        return {
+            'id': video_id,
+            'title': title,
+            'description': self._og_search_description(webpage),
+            'thumbnail': self._og_search_thumbnail(webpage),
+            'uploader': self._search_regex(r'<div[^>]+id="uploader"[^>]*>([^<]+)<', webpage, 'uploader', fatal=False),
+        }