From 4555a88fd71693b70241e6e43875316542484060 Mon Sep 17 00:00:00 2001 From: fnord Date: Mon, 13 Jul 2015 12:02:34 -0500 Subject: [PATCH] Generic: Eliminate redundant iframe/embed src regexp matching and extractor._VALID_URL duplication --- youtube_dl/extractor/generic.py | 213 -------------------------------- 1 file changed, 213 deletions(-) diff --git a/youtube_dl/extractor/generic.py b/youtube_dl/extractor/generic.py index ac94dcd39..0649ec1fe 100644 --- a/youtube_dl/extractor/generic.py +++ b/youtube_dl/extractor/generic.py @@ -1217,17 +1217,6 @@ class GenericIE(InfoExtractor): 'entries': entries, } - # Look for embedded rtl.nl player - matches = re.findall( - r']+?src="((?:https?:)?//(?:www\.)?rtl\.nl/system/videoplayer/[^"]+(?:video_)?embed[^"]+)"', - webpage) - if matches: - return _playlist_from_matches(matches, ie='RtlNl') - - vimeo_url = VimeoIE._extract_vimeo_url(url, webpage) - if vimeo_url is not None: - return self.url_result(vimeo_url) - # Look for embedded YouTube player matches = re.findall(r'''(?x) (?: @@ -1251,13 +1240,6 @@ class GenericIE(InfoExtractor): if matches: return _playlist_from_matches(matches, lambda m: unescapeHTML(m)) - # Look for embedded Dailymotion player - matches = re.findall( - r']+?src=(["\'])(?P(?:https?:)?//(?:www\.)?dailymotion\.com/embed/video/.+?)\1', webpage) - if matches: - return _playlist_from_matches( - matches, lambda m: unescapeHTML(m[1])) - # Look for embedded Dailymotion playlist player (#3822) m = re.search( r']+?src=(["\'])(?P(?:https?:)?//(?:www\.)?dailymotion\.[a-z]{2,3}/widget/jukebox\?.+?)\1', webpage) @@ -1299,11 +1281,6 @@ class GenericIE(InfoExtractor): if bliptv_url: return self.url_result(bliptv_url, 'BlipTV') - # Look for SVT player - svt_url = SVTIE._extract_url(webpage) - if svt_url: - return self.url_result(svt_url, 'SVT') - # Look for embedded condenast player matches = re.findall( r']+?src=(["\'])(?P(?:https?:)?//(?:cache\.)?vevo\.com/.+?)\1', webpage) - if mobj is not None: - return self.url_result(mobj.group('url')) - # Look for embedded Viddler player mobj = re.search( r'<(?:iframe[^>]+?src|param[^>]+?value)=(["\'])(?P(?:https?:)?//(?:www\.)?viddler\.com/(?:embed|player)/.+?)\1', @@ -1340,19 +1311,6 @@ class GenericIE(InfoExtractor): if mobj is not None: return self.url_result(mobj.group('url')) - # Look for NYTimes player - mobj = re.search( - r']+src=(["\'])(?P(?:https?:)?//graphics8\.nytimes\.com/bcvideo/[^/]+/iframe/embed\.html.+?)\1>', - webpage) - if mobj is not None: - return self.url_result(mobj.group('url')) - - # Look for Libsyn player - mobj = re.search( - r']+src=(["\'])(?P(?:https?:)?//html5-player\.libsyn\.com/embed/.+?)\1', webpage) - if mobj is not None: - return self.url_result(mobj.group('url')) - # Look for Ooyala videos mobj = (re.search(r'player\.ooyala\.com/[^"?]+\?[^"]*?(?:embedCode|ec)=(?P[^"&]+)', webpage) or re.search(r'OO\.Player\.create\([\'"].*?[\'"],\s*[\'"](?P.{32})[\'"]', webpage) or @@ -1369,16 +1327,6 @@ class GenericIE(InfoExtractor): return _playlist_from_matches( embeds, getter=lambda v: OoyalaIE._url_for_embed_code(v['provider_video_id']), ie='Ooyala') - # Look for Aparat videos - mobj = re.search(r'