54 lines
2.0 KiB
Python
Raw Normal View History

2018-09-06 15:41:07 +02:00
from __future__ import unicode_literals
import re
from .common import InfoExtractor
class WWEIE(InfoExtractor):
_VALID_URL = r'https?://(?:\w+\.)?wwe.com/(?:.*/)?videos/(?P<id>[\w-]+)'
_TESTS = [{
'url': 'https://www.wwe.com/videos/daniel-bryan-vs-andrade-cien-almas-smackdown-live-sept-4-2018',
'info_dict': {
'id': 'sd994_bryan_almas_090418',
'ext': 'mp4',
'title': 'Daniel Bryan vs. Andrade "Cien" Almas: SmackDown LIVE, Sept. 4, 2018',
'description': 'Still fuming after he and his wife Brie Bella were attacked by The Miz and Maryse last week, Daniel Bryan takes care of some unfinished business with Andrade "Cien" Almas.',
'thumbnail': 'https://www.wwe.com/f/styles/wwe_16_9_s/public/2018/09/20180904_sd_danielalmas--d97661dd31eea8a99837a3dbc7121f8f.jpg',
}
}, {
'url': 'https://de.wwe.com/videos/gran-metalik-vs-tony-nese-wwe-205-live-sept-4-2018',
'only_matching': True,
}]
def _real_extract(self, url):
display_id = self._match_id(url)
webpage = self._download_webpage(url, display_id)
drupal_settings = self._parse_json(
self._html_search_regex(
r'(?s)Drupal\.settings\s*,\s*({.+?})\);',
webpage, 'drupal settings'),
display_id)
player = drupal_settings['WWEVideoLanding']['initialVideo']
metadata = player['playlist'][0]
title = metadata.get('title')
video_url = 'https:' + metadata.get('file')
thumbnail = 'https://www.wwe.com' + metadata.get('image')
description = metadata.get('description')
id = re.split('[/.]', video_url)[-2]
formats = self._extract_m3u8_formats(video_url, id, 'mp4')
return {
'id': id,
'title': title,
'formats': formats,
'url': video_url,
'display_id': display_id,
'thumbnail': thumbnail,
'description': description,
}