69 lines
2.2 KiB
Python
Raw Normal View History

2018-03-14 09:43:11 -04:00
from __future__ import unicode_literals
import re
from .common import InfoExtractor
from ..utils import (
decode_packed_codes,
ExtractorError,
2018-03-15 02:06:12 -04:00
js_to_json,
2018-03-14 09:43:11 -04:00
)
class VidtodoIE(InfoExtractor):
    """Extractor for videos hosted on vidtodo and its mirror domains.

    The watch page is downloaded from ``vidtod.me``; a packed script found
    in it is decoded with ``decode_packed_codes`` and the jwplayer
    ``setup(...)`` argument inside the decoded code is parsed for formats.
    A source URL wrapped in ``xpro(...)`` is decoded with :meth:`xpro`
    before the setup data is parsed.
    """

    # NOTE(review): 'vidt.d?.+' uses unescaped dots and a greedy '.+', so it
    # accepts many more hosts than the mirrors seen in this file
    # (vidtodo.me, vidtodo.com, vidtod.me). Tighten once the full list of
    # valid domains is confirmed.
    _VALID_URL = r'https?://(?:www\.)?vidt.d?.+\.(?:me|com)/(?:embed-)?(?P<id>\w+)'
    _TESTS = [{
        'url': 'https://vidtodo.me/4c8rx0tt8ek4',
        'md5': 'cfd8415e586d59a4de942757eeb7145f',
        'info_dict': {
            'id': '4c8rx0tt8ek4',
            'ext': 'mp4',
            'title': 'Watch 343291981 mp4',
        },
    }]
    # Browser-like User-Agent sent with the page request.
    _USER_AGENT = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/56.0.2924.87 Safari/537.36'

    @staticmethod
    def xpro(encoded_url):
        """Return *encoded_url* with every ASCII letter rotated by 13 places.

        Letter case is preserved. Digits, punctuation, quotes and non-ASCII
        characters are passed through unchanged. (Previously uppercase and
        non-ASCII letters were all turned into ``'z'`` because the lookup
        table only contained lowercase letters.)
        """
        lower = 'abcdefghijklmnopqrstuvwxyz'
        upper = lower.upper()
        # ROT13 is its own inverse, so one table serves for decoding.
        table = dict(zip(
            lower + upper,
            lower[13:] + lower[:13] + upper[13:] + upper[:13]))
        return ''.join(table.get(char, char) for char in encoded_url)

    def _real_extract(self, url):
        """Extract the info dict for the video addressed by *url*.

        Raises ExtractorError('File not found') when the page contains no
        packed script, and the extractor's regex-not-found error when the
        decoded script has no recognisable jwplayer setup call.
        """
        video_id = self._match_id(url)

        headers = {
            'User-Agent': self._USER_AGENT,
            'Connection': 'keep-alive',
            'referer': 'https://vidtodo.com',
        }

        # The page is always requested from vidtod.me, regardless of the
        # host in the input URL.
        webpage = self._download_webpage(
            'http://vidtod.me/%s' % video_id, video_id, headers=headers)

        title = self._html_search_regex(
            r'<title>(.+?)</title>', webpage, 'title')

        # Check the match before calling .group(); a missing script must
        # surface as "File not found", not as an AttributeError on None.
        packed = re.search(r"}\('.+\.split\('\|'\)", webpage)
        if not packed:
            raise ExtractorError(
                'File not found', expected=True, video_id=video_id)
        codes = decode_packed_codes(packed.group(0))

        # The capture ends at the '.jpg"' value, i.e. before the object's
        # closing brace, so the brace is re-appended. The lookup is fatal:
        # without the setup data nothing can be extracted, and a None
        # result would otherwise fail on the concatenation.
        source = self._search_regex(
            r'setup\(([^)].+\.jpg\")', codes, 'jwplayer data') + '}'

        # An xpro(...) wrapper is optional, so its absence is not reported.
        encoded_url = self._search_regex(
            r'xpro\((.+?)\)', source, 'encoded url', default=None)
        if encoded_url:
            source = source.replace(
                'xpro(' + encoded_url + ')', self.xpro(encoded_url))

        jwplayer_data = self._parse_json(
            source, video_id, transform_source=js_to_json)

        info_dict = self._parse_jwplayer_data(
            jwplayer_data, video_id, require_title=False)
        # The page <title> replaces any title from the jwplayer data.
        info_dict['title'] = title
        return info_dict