[hhu] Add new extractor
This commit is contained in:
parent
74bc299453
commit
5426937075
@ -438,6 +438,7 @@ from .hellporno import HellPornoIE
|
|||||||
from .helsinki import HelsinkiIE
|
from .helsinki import HelsinkiIE
|
||||||
from .hentaistigma import HentaiStigmaIE
|
from .hentaistigma import HentaiStigmaIE
|
||||||
from .hgtv import HGTVComShowIE
|
from .hgtv import HGTVComShowIE
|
||||||
|
from .hhu import HHUIE
|
||||||
from .hketv import HKETVIE
|
from .hketv import HKETVIE
|
||||||
from .hidive import HiDiveIE
|
from .hidive import HiDiveIE
|
||||||
from .historicfilms import HistoricFilmsIE
|
from .historicfilms import HistoricFilmsIE
|
||||||
|
72
youtube_dl/extractor/hhu.py
Normal file
72
youtube_dl/extractor/hhu.py
Normal file
@ -0,0 +1,72 @@
|
|||||||
|
# coding: utf-8
|
||||||
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
|
from .common import InfoExtractor
|
||||||
|
|
||||||
|
|
||||||
|
class HHUIE(InfoExtractor):
|
||||||
|
_VALID_URL = r'https://mediathek\.hhu\.de/watch/(?P<id>.+)'
|
||||||
|
_TEST = {
|
||||||
|
'url': 'https://mediathek.hhu.de/watch/2dd05982-ea45-4108-9620-0c36e6ed8df5',
|
||||||
|
'md5': 'b99ff77f2148b1e754555abdf53f0e51',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '2dd05982-ea45-4108-9620-0c36e6ed8df5',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'Das Multimediazentrum',
|
||||||
|
'description': '',
|
||||||
|
'uploader_id': 'clames',
|
||||||
|
'thumbnail': 'https://mediathek.hhu.de/thumbs/2dd05982-ea45-4108-9620-0c36e6ed8df5/thumb_000.jpg',
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
def _real_extract(self, url):
|
||||||
|
# TODO: Login for some videos.
|
||||||
|
video_id = self._match_id(url)
|
||||||
|
webpage, webpage_url = self._download_webpage_handle(url, video_id)
|
||||||
|
if webpage_url.geturl().startswith("https://sts."):
|
||||||
|
self.raise_login_required()
|
||||||
|
file_id = self._html_search_regex(
|
||||||
|
r"{ file: '\/movies\/(.+?)\/v_100\.mp4', label: '",
|
||||||
|
webpage, 'file_id'
|
||||||
|
)
|
||||||
|
formats = [
|
||||||
|
({'url': format_url.format(file_id)})
|
||||||
|
for format_url in (
|
||||||
|
'https://mediathek.hhu.de/movies/{}/v_10.webm',
|
||||||
|
'https://mediathek.hhu.de/movies/{}/v_10.mp4',
|
||||||
|
'https://mediathek.hhu.de/movies/{}/v_50.webm',
|
||||||
|
'https://mediathek.hhu.de/movies/{}/v_50.mp4',
|
||||||
|
'https://mediathek.hhu.de/movies/{}/v_100.webm',
|
||||||
|
'https://mediathek.hhu.de/movies/{}/v_100.mp4',
|
||||||
|
)
|
||||||
|
]
|
||||||
|
try:
|
||||||
|
title = self._og_search_title(webpage)
|
||||||
|
except:
|
||||||
|
title = self._html_search_regex(
|
||||||
|
r'<h1 id="mt_watch-headline-title">\s+(.+?)\s+<\/h1>',
|
||||||
|
webpage, 'title'
|
||||||
|
)
|
||||||
|
try:
|
||||||
|
description = self._og_search_description(webpage)
|
||||||
|
except:
|
||||||
|
description = self._html_search_regex(
|
||||||
|
r'<p id="mt_watch-description" class="watch-description">\s+(.+?)\s+<\/p>',
|
||||||
|
webpage, 'description', fatal=False
|
||||||
|
)
|
||||||
|
thumbnail = self._og_search_property(
|
||||||
|
'image:secure_url', webpage, 'thumbnail'
|
||||||
|
)
|
||||||
|
uploader_id = self._html_search_regex(
|
||||||
|
r'<a id="mt_content_placeholder_videoinfo_createdby" class="author" href=".+">(.+?)<\/a>',
|
||||||
|
webpage, 'uploader', fatal=False
|
||||||
|
)
|
||||||
|
|
||||||
|
return {
|
||||||
|
'id': video_id,
|
||||||
|
'title': title,
|
||||||
|
'description': description,
|
||||||
|
'uploader_id': uploader_id,
|
||||||
|
'thumbnail': thumbnail,
|
||||||
|
'formats': formats,
|
||||||
|
}
|
Loading…
x
Reference in New Issue
Block a user