2016-06-30 14:57:42 +02:00
|
|
|
from __future__ import unicode_literals
|
|
|
|
|
|
|
|
from .common import InfoExtractor
|
2018-10-22 19:41:17 -04:00
|
|
|
from ..utils import ExtractorError, int_or_none
|
2016-06-30 14:57:42 +02:00
|
|
|
|
|
|
|
|
|
|
|
class FusionIE(InfoExtractor):
    """Extractor for video pages on fusion.net / fusion.tv.

    The page embeds a ``fusionData`` JavaScript object; its ``single`` entry
    carries the metadata read here.  When that entry has no ``src`` mapping
    the extractor hands over to the Youtube extractor using the id found
    under ``video_ids.youtube``.
    """

    _VALID_URL = r'https?://(?:www\.)?fusion\.(?:net|tv)/video/(?P<id>\d+)'
    _TESTS = [{
        'url': 'http://fusion.tv/video/201781/u-s-and-panamanian-forces-work-together-to-stop-a-vessel-smuggling-drugs/',
        'info_dict': {
            'id': '0eaph8eeMwQ',
            'ext': 'mp4',
            'title': 'U.S. and Panamanian forces work together to stop a vessel smuggling drugs',
            'description': 'md5:0cc84a9943c064c0f46b128b41b1b0d7',
            'uploader': 'FUSION',
            'uploader_id': 'thisisfusion',
            'upload_date': '20150918'
        },
        'params': {
            'skip_download': True,
        },
        'add_ie': ['Youtube'],
    }, {
        'url': 'http://fusion.tv/video/201781',
        'only_matching': True,
    }, {
        'url': 'https://fusion.tv/video/584520/dreaming-of-the-whitest-christmas/',
        'info_dict': {
            'id': '584520',
            'ext': 'm3u8',
            'title': 'Dreaming of the Whitest Christmas',
            'description': 'md5:350a32da86dc05a2179c9694d9d61feb',
            'release_date': '20171211',
            'thumbnail': r're:http.*.jpg[?]?',
        },
        'params': {
            'skip_download': True,
        }
    }]

    # Keys of the ``src`` mapping that are turned into formats; any other
    # key is ignored.
    _SUPPORTED_FORMATS = ('m3u8-hp-v3', 'm3u8-variant', 'mp4')

    @staticmethod
    def _build_formats(srcs):
        """Turn the ``src`` mapping into a list of format dicts.

        ``srcs`` maps a format key to a mapping of variants; each variant is
        read for ``url``, ``width``, ``height`` and ``type``.  Variants
        without a URL are skipped.  The result is sorted by ascending
        ``quality`` (width * height, with missing dimensions counted as 0).
        """
        formats = []
        for format_id, variants in srcs.items():
            if format_id not in FusionIE._SUPPORTED_FORMATS:
                continue
            if not isinstance(variants, dict):
                continue

            for vid in variants.values():
                if not isinstance(vid, dict):
                    continue
                video_url = vid.get('url')
                if not video_url:
                    # A format without a URL cannot be downloaded.
                    continue

                width = int_or_none(vid.get('width'))
                height = int_or_none(vid.get('height'))

                # ``type`` looks like a MIME type ("video/mp4"); keep the
                # part after the first slash when there is one.
                mime_parts = (vid.get('type') or '').split('/')
                format_note = mime_parts[1] if len(mime_parts) > 1 else None

                formats.append({
                    'url': video_url,
                    'width': width,
                    'height': height,
                    'format_note': format_note,
                    'protocol': 'm3u8' if format_id.startswith('m3u8') else None,
                    # Treat unknown dimensions as 0 so the product never
                    # fails on None.
                    'quality': (width or 0) * (height or 0),
                })

        formats.sort(key=lambda f: f['quality'])
        return formats

    def _real_extract(self, url):
        """Extract video information from a Fusion video page.

        Returns an info dict with ``formats`` when the page data has a
        ``src`` mapping; otherwise returns a ``url``-type result delegating
        to the Youtube extractor.

        Raises ExtractorError when the ``single`` entry is missing from
        ``fusionData`` or when neither ``src`` nor a Youtube id is present.
        """
        display_id = self._match_id(url)
        webpage = self._download_webpage(url, display_id)

        fusion_data = self._parse_json(
            self._search_regex(
                r'(?si)fusionData\s*=\s*({.*?});', webpage,
                'fusionData'),
            display_id)

        data = fusion_data.get('single')
        if not isinstance(data, dict):
            raise ExtractorError('Could not find video data in fusionData')

        info = {
            'id': display_id,
            'title': data.get('title'),
            'display_id': data.get('slug'),
            'description': data.get('excerpt'),
        }

        # ``published`` is expected to look like "YYYY-MM-DDT..."; only the
        # date part before the "T" is kept, with dashes removed.
        published = data.get('published')
        if published and 'T' in published:
            info['release_date'] = published.split('T')[0].replace('-', '')

        images = data.get('images')
        if isinstance(images, dict):
            # Distinct loop names: on Python 2 comprehension variables leak
            # into the enclosing scope and would overwrite ``url``.
            info['thumbnails'] = [
                {'id': image_id, 'url': image_url}
                for image_id, image_url in images.items()]

        srcs = data.get('src')
        if not srcs:
            # No direct sources: fall back to the Youtube id, if any.
            youtube_id = (data.get('video_ids') or {}).get('youtube')
            if not youtube_id:
                raise ExtractorError('Could not find alternate youtube url')

            info['_type'] = 'url'
            info['url'] = youtube_id
            info['ie_key'] = 'Youtube'
            return info

        info['formats'] = self._build_formats(srcs)
        return info
|