104 lines
3.0 KiB
Python
Raw Normal View History

# coding: utf-8
from __future__ import unicode_literals
from .common import InfoExtractor
2019-07-07 23:04:09 +02:00
class RTVSTVIE(InfoExtractor):
_VALID_URL = r'https?://(?:www\.)?rtvs\.sk/(?:televizia)/archiv/\d+/(?P<id>\d+)'
_TEST = {
'url': 'http://www.rtvs.sk/televizia/archiv/8249/63118',
'md5': '85e2c55cf988403b70cac24f5c086dc6',
'info_dict': {
2019-06-29 19:10:17 +02:00
'id': '17189',
'ext': 'mp4',
'title': 'Amaro Džives - Náš deň',
'description': 'Galavečer pri príležitosti Medzinárodného dňa Rómov.'
},
'params': {
'skip_download': True,
}
2019-07-07 23:04:09 +02:00
}
def _real_extract(self, url):
video_id = self._match_id(url)
webpage = self._download_webpage(url, video_id)
playlist_url = self._search_regex(
2019-06-29 19:10:17 +02:00
r'url = (["\'])(?:https?:)?(?://)(?P<url>(?:(?!\1).)+)\1', webpage,
'playlist url', group='url')
2019-06-29 19:10:17 +02:00
if not playlist_url.startswith("http"):
playlist_url = "http://" + playlist_url
data = self._download_json(
2019-06-29 19:10:17 +02:00
playlist_url, video_id, 'Downloading playlist')
2019-07-07 23:04:09 +02:00
data_media = data['clip']
2019-06-29 19:10:17 +02:00
media_id = data_media['mediaid']
title = data_media['title']
description = data_media.get('description')
thumbnail = data_media.get('image')
2019-07-07 23:04:09 +02:00
urldl = data_media['sources'][0]['src']
formats = self._extract_m3u8_formats(
urldl, video_id, 'mp4',
entry_protocol='m3u8_native', m3u8_id='hls')
2019-06-29 19:10:17 +02:00
2019-07-07 23:04:09 +02:00
return {
2019-06-29 19:10:17 +02:00
'id': media_id,
'title': title,
'description': description,
'thumbnail': thumbnail,
2019-07-07 23:04:09 +02:00
'formats': formats
2019-06-29 19:10:17 +02:00
}
2019-07-07 23:04:09 +02:00
class RTVSRADIOIE(InfoExtractor):
_VALID_URL = r'https?://(?:www\.)?rtvs\.sk/(?:radio)/archiv/\d+/(?P<id>\d+)'
_TEST = {
'url': 'http://www.rtvs.sk/radio/archiv/11224/414872',
'md5': '134d5d6debdeddf8a5d761cbc9edacb8',
'info_dict': {
'id': '135320',
'ext': 'mp3',
'title': 'Ostrov pokladov 1 časť.mp3'
},
'params': {
'skip_download': True,
}
}
def _real_extract(self, url):
video_id = self._match_id(url)
2019-06-29 19:10:17 +02:00
2019-07-07 23:04:09 +02:00
webpage = self._download_webpage(url, video_id)
playlist_url = self._search_regex(
r'url = (["\'])(?:https?:)?(?://)(?P<url>(?:(?!\1).)+)\1', webpage,
'playlist url', group='url')
if not playlist_url.startswith("http"):
playlist_url = "http://" + playlist_url
data = self._download_json(
playlist_url, video_id, 'Downloading playlist')
data_media = data['playlist'][0]
media_id = data_media['mediaid']
title = data_media['title']
description = data_media.get('description')
thumbnail = data_media.get('image')
urldl = data_media['sources'][0]['src']
return {
'id': media_id,
'title': title,
'description': description,
'thumbnail': thumbnail,
'url': urldl
}