# coding: utf-8 from __future__ import unicode_literals from .common import InfoExtractor from ..utils import parse_duration from ..compat import ( compat_parse_qs, compat_urllib_parse_urlparse, ) class SeneddIE(InfoExtractor): _VALID_URL = r'http://senedd\.tv/Meeting/(?:Archive|Clip)/(?P[0-9a-f\-]+)' # TODO: some old links which redirect: http://www.senedd.tv/cy/4251?startPos=6&l=cy _TEST = { 'url': 'http://senedd.tv/Meeting/Clip/f2a274d3-a15a-4dec-b92b-be233eed9601?inPoint=00:50:35&outPoint=02:39:16', # http://senedd.tv/Meeting/Archive/f2a274d3-a15a-4dec-b92b-be233eed9601?autostart=True 'md5': '673307fe76d3c885bf02d8b146f10a2f', 'info_dict': { 'id': 'f2a274d3-a15a-4dec-b92b-be233eed9601', 'ext': 'mp4', 'title': 'Plenary', 'thumbnail': r're:^http://.*\.jpg$', 'language': 'en', } } def _real_extract(self, url): video_id = self._match_id(url) # http://player.nafw.cloud.vualto.com/Player/Index/f2a274d3-a15a-4dec-b92b-be233eed9601?autostart=True&captionsOn=False webpage = self._download_webpage(url, video_id) inverted_language = self._html_search_regex(r'