2017-10-19 17:17:20 +02:00
|
|
|
# coding: utf-8
|
|
|
|
from __future__ import unicode_literals
|
|
|
|
|
2019-02-24 23:19:15 +07:00
|
|
|
import re
|
|
|
|
|
2017-10-19 17:17:20 +02:00
|
|
|
from .common import InfoExtractor
|
2020-04-13 15:07:57 +02:00
|
|
|
from ..utils import ExtractorError, JSON_LD_RE
|
2017-10-19 17:17:20 +02:00
|
|
|
|
|
|
|
|
|
|
|
class ServusIE(InfoExtractor):
    """Extractor for video pages on servus.com and servustv.com.

    Matched URLs carry either an ``AA-...`` style identifier (in either
    letter case) or a ``<digits>-<digits>`` identifier as their last path
    component; see ``_VALID_URL`` for the accepted URL layouts.
    """

    _VALID_URL = r'''(?x)
                    https?://
                        (?:www\.)?
                        (?:
                            servus\.com/(?:(?:at|de)/p/[^/]+|tv/videos)|
                            servustv\.com/videos
                        )
                        /(?P<id>[aA]{2}-\w+|\d+-\d+)
                    '''
    _TESTS = [{
        # new URL schema
        'url': 'https://www.servustv.com/videos/aa-1t6vbu5pw1w12/',
        'md5': '9f825d6ec14b3d8bebc5b23d094e1e51',
        'info_dict': {
            'id': 'AA-1T6VBU5PW1W12',
            'ext': 'mp4',
            'title': 'Die Grünen aus Sicht des Volkes',
            'description': 'md5:1247204d85783afe3682644398ff2ec4',
            'upload_date': '20170911',
            'timestamp': 1505147648,
        }
    }, {
        # old URL schema
        'url': 'https://www.servus.com/de/p/Die-Gr%C3%BCnen-aus-Sicht-des-Volkes/AA-1T6VBU5PW1W12/',
        'only_matching': True,
    }, {
        'url': 'https://www.servus.com/at/p/Wie-das-Leben-beginnt/1309984137314-381415152/',
        'only_matching': True,
    }, {
        'url': 'https://www.servus.com/tv/videos/aa-1t6vbu5pw1w12/',
        'only_matching': True,
    }, {
        'url': 'https://www.servus.com/tv/videos/1380889096408-1235196658/',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Build the info dict for the video page at ``url``.

        The page is downloaded, checked for the player marker, and its
        JSON-LD blocks are scanned for the first one that yields a stream
        URL. That URL is then passed to ``_extract_m3u8_formats`` to obtain
        the formats.

        Returns the info dict produced from the JSON-LD data, with ``id``
        set to the upper-cased video id and ``formats`` filled in.

        Raises ExtractorError if the page lacks the player marker (reported
        as an expected error) or if no JSON-LD block provides a video URL.
        """
        # The id is upper-cased so that lower-case URL variants map to the
        # same identifier (see the 'id' expected by the first test case).
        video_id = self._match_id(url).upper()
        webpage = self._download_webpage(url, video_id)

        if 'rbmh-video-player-trigger' not in webpage:
            raise ExtractorError(
                'Video not available (maybe not aired yet)',
                expected=True, video_id=video_id)

        for mobj in re.finditer(JSON_LD_RE, webpage):
            info = self._json_ld(mobj.group('json_ld'), video_id)
            # A non-empty result is not enough: the 'url' entry is required
            # below, so keep looking until a block actually provides one
            # instead of failing later with a bare KeyError.
            if info and info.get('url'):
                break
        else:
            # Reached only when the loop finished without a usable block
            # (including the case of no JSON-LD on the page at all).
            raise ExtractorError(
                'Could not extract video URL', video_id=video_id)

        info['id'] = video_id
        info['formats'] = self._extract_m3u8_formats(
            info['url'], video_id, 'mp4')
        self._sort_formats(info['formats'])

        return info
|