57 lines
		
	
	
		
			2.0 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
		
		
			
		
	
	
			57 lines
		
	
	
		
			2.0 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
|  | # -*- coding: utf-8 -*- | ||
|  | from __future__ import unicode_literals | ||
|  | 
 | ||
|  | import json | ||
|  | import re | ||
|  | from .common import InfoExtractor | ||
|  | from ..utils import ( | ||
|  |     js_to_json, | ||
|  |     remove_end, | ||
|  | ) | ||
|  | 
 | ||
|  | 
 | ||
|  | class SBSIE(InfoExtractor): | ||
|  |     IE_DESC = 'sbs.com.au' | ||
|  |     _VALID_URL = r'https?://(?:www\.)?sbs\.com\.au/ondemand/video/single/(?P<id>[0-9]+)/' | ||
|  | 
 | ||
|  |     _TESTS = [{ | ||
|  |         # Original URL is handled by the generic IE which finds the iframe: | ||
|  |         # http://www.sbs.com.au/thefeed/blog/2014/08/21/dingo-conservation | ||
|  |         'url': 'http://www.sbs.com.au/ondemand/video/single/320403011771/?source=drupal&vertical=thefeed', | ||
|  |         'md5': '3150cf278965eeabb5b4cea1c963fe0a', | ||
|  |         'info_dict': { | ||
|  |             'id': '320403011771', | ||
|  |             'ext': 'flv', | ||
|  |             'title': 'Dingo Conservation', | ||
|  |             'description': 'Dingoes are on the brink of extinction; most of the animals we think are dingoes are in fact crossbred with wild dogs. This family run a dingo conservation park to prevent their extinction', | ||
|  |             'thumbnail': 're:http://.*\.jpg', | ||
|  |         }, | ||
|  |         'add_ies': ['generic'], | ||
|  |     }] | ||
|  | 
 | ||
|  |     def _real_extract(self, url): | ||
|  |         mobj = re.match(self._VALID_URL, url) | ||
|  |         video_id = mobj.group('id') | ||
|  |         webpage = self._download_webpage(url, video_id) | ||
|  | 
 | ||
|  |         release_urls_json = js_to_json(self._search_regex( | ||
|  |             r'(?s)playerParams\.releaseUrls\s*=\s*(\{.*?\n\});\n', | ||
|  |             webpage, '')) | ||
|  |         release_urls = json.loads(release_urls_json) | ||
|  |         theplatform_url = ( | ||
|  |             release_urls.get('progressive') or release_urls.get('standard')) | ||
|  | 
 | ||
|  |         title = remove_end(self._og_search_title(webpage), ' (The Feed)') | ||
|  |         description = self._html_search_meta('description', webpage) | ||
|  |         thumbnail = self._og_search_thumbnail(webpage) | ||
|  | 
 | ||
|  |         return { | ||
|  |             '_type': 'url_transparent', | ||
|  |             'id': video_id, | ||
|  |             'url': theplatform_url, | ||
|  | 
 | ||
|  |             'title': title, | ||
|  |             'description': description, | ||
|  |             'thumbnail': thumbnail, | ||
|  |         } |