From 31fa1e92b663eb67d7f814e659b3ab3d2d7b6abd Mon Sep 17 00:00:00 2001 From: cwd24 Date: Wed, 11 Apr 2018 01:28:02 +0200 Subject: [PATCH] [senedd] add extractor for senedd.tv --- youtube_dl/extractor/extractors.py | 1 + youtube_dl/extractor/senedd.py | 63 ++++++++++++++++++++++++++++++ 2 files changed, 64 insertions(+) create mode 100644 youtube_dl/extractor/senedd.py diff --git a/youtube_dl/extractor/extractors.py b/youtube_dl/extractor/extractors.py index c9f60114d..691bc3ac6 100644 --- a/youtube_dl/extractor/extractors.py +++ b/youtube_dl/extractor/extractors.py @@ -947,6 +947,7 @@ from .scrippsnetworks import ScrippsNetworksWatchIE from .seeker import SeekerIE from .senateisvp import SenateISVPIE from .sendtonews import SendtoNewsIE +from .senedd import SeneddIE from .servingsys import ServingSysIE from .servus import ServusIE from .sevenplus import SevenPlusIE diff --git a/youtube_dl/extractor/senedd.py b/youtube_dl/extractor/senedd.py new file mode 100644 index 000000000..637dd45fb --- /dev/null +++ b/youtube_dl/extractor/senedd.py @@ -0,0 +1,63 @@ +# coding: utf-8 +from __future__ import unicode_literals + +from .common import InfoExtractor +from ..utils import parse_duration +from ..compat import ( + compat_parse_qs, + compat_urllib_parse_urlparse, +) + + +class SeneddIE(InfoExtractor): + _VALID_URL = r'http://senedd\.tv/Meeting/(?:Archive|Clip)/(?P<id>[0-9a-f\-]+)' + # TODO: some old links which redirect: http://www.senedd.tv/cy/4251?startPos=6&l=cy + _TEST = { + 'url': 'http://senedd.tv/Meeting/Clip/f2a274d3-a15a-4dec-b92b-be233eed9601?inPoint=00:50:35&outPoint=02:39:16', + # http://senedd.tv/Meeting/Archive/f2a274d3-a15a-4dec-b92b-be233eed9601?autostart=True + 'md5': '673307fe76d3c885bf02d8b146f10a2f', + 'info_dict': { + 'id': 'f2a274d3-a15a-4dec-b92b-be233eed9601', + 'ext': 'mp4', + 'title': 'Plenary', + 'thumbnail': r're:^http://.*\.jpg$', + 'language': 'en', + } + } + + def _real_extract(self, url): + video_id = self._match_id(url) + # 
http://player.nafw.cloud.vualto.com/Player/Index/f2a274d3-a15a-4dec-b92b-be233eed9601?autostart=True&captionsOn=False + webpage = self._download_webpage(url, video_id) + inverted_language = self._html_search_regex(r'