| 
									
										
										
										
											2014-05-30 16:35:17 +02:00
										 |  |  | # coding: utf-8 | 
					
						
							|  |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | from .common import InfoExtractor | 
					
						
							| 
									
										
										
										
											2015-06-09 20:36:08 +06:00
										 |  |  | from ..compat import compat_urllib_parse_urlparse | 
					
						
							|  |  |  | from ..utils import ( | 
					
						
							|  |  |  |     determine_ext, | 
					
						
							|  |  |  |     float_or_none, | 
					
						
							|  |  |  | ) | 
					
						
							| 
									
										
										
										
											2014-05-30 16:35:17 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-07 15:33:45 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-05-30 16:35:17 +02:00
										 |  |  | class SpiegeltvIE(InfoExtractor): | 
					
						
							| 
									
										
										
										
											2014-11-16 00:40:09 +01:00
										 |  |  |     _VALID_URL = r'https?://(?:www\.)?spiegel\.tv/(?:#/)?filme/(?P<id>[\-a-z0-9]+)' | 
					
						
							| 
									
										
										
										
											2014-11-16 00:33:51 +01:00
										 |  |  |     _TESTS = [{ | 
					
						
							| 
									
										
										
										
											2014-05-30 16:35:17 +02:00
										 |  |  |         'url': 'http://www.spiegel.tv/filme/flug-mh370/', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': 'flug-mh370', | 
					
						
							|  |  |  |             'ext': 'm4v', | 
					
						
							|  |  |  |             'title': 'Flug MH370', | 
					
						
							|  |  |  |             'description': 'Das Rätsel um die Boeing 777 der Malaysia-Airlines', | 
					
						
							| 
									
										
										
										
											2017-01-02 20:08:07 +08:00
										 |  |  |             'thumbnail': r're:http://.*\.jpg$', | 
					
						
							| 
									
										
										
										
											2014-06-03 16:50:54 +02:00
										 |  |  |         }, | 
					
						
							|  |  |  |         'params': { | 
					
						
							| 
									
										
										
										
											2015-06-09 20:36:08 +06:00
										 |  |  |             # m3u8 download | 
					
						
							| 
									
										
										
										
											2014-06-03 16:50:54 +02:00
										 |  |  |             'skip_download': True, | 
					
						
							| 
									
										
										
										
											2014-05-30 16:35:17 +02:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2014-11-16 00:40:09 +01:00
										 |  |  |     }, { | 
					
						
							|  |  |  |         'url': 'http://www.spiegel.tv/#/filme/alleskino-die-wahrheit-ueber-maenner/', | 
					
						
							|  |  |  |         'only_matching': True, | 
					
						
							| 
									
										
										
										
											2014-11-16 00:33:51 +01:00
										 |  |  |     }] | 
					
						
							| 
									
										
										
										
											2014-05-30 16:35:17 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def _real_extract(self, url): | 
					
						
							| 
									
										
										
										
											2014-11-16 00:40:09 +01:00
										 |  |  |         if '/#/' in url: | 
					
						
							|  |  |  |             url = url.replace('/#/', '/') | 
					
						
							| 
									
										
										
										
											2014-11-16 00:33:51 +01:00
										 |  |  |         video_id = self._match_id(url) | 
					
						
							| 
									
										
										
										
											2014-05-30 16:35:17 +02:00
										 |  |  |         webpage = self._download_webpage(url, video_id) | 
					
						
							|  |  |  |         title = self._html_search_regex(r'<h1.*?>(.*?)</h1>', webpage, 'title') | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-07 15:33:45 +02:00
										 |  |  |         apihost = 'http://spiegeltv-ivms2-restapi.s3.amazonaws.com' | 
					
						
							|  |  |  |         version_json = self._download_json( | 
					
						
							|  |  |  |             '%s/version.json' % apihost, video_id, | 
					
						
							|  |  |  |             note='Downloading version information') | 
					
						
							|  |  |  |         version_name = version_json['version_name'] | 
					
						
							| 
									
										
										
										
											2014-05-30 16:35:17 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-07 15:33:45 +02:00
										 |  |  |         slug_json = self._download_json( | 
					
						
							|  |  |  |             '%s/%s/restapi/slugs/%s.json' % (apihost, version_name, video_id), | 
					
						
							|  |  |  |             video_id, | 
					
						
							|  |  |  |             note='Downloading object information') | 
					
						
							|  |  |  |         oid = slug_json['object_id'] | 
					
						
							| 
									
										
										
										
											2014-05-30 16:35:17 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-07 15:33:45 +02:00
										 |  |  |         media_json = self._download_json( | 
					
						
							|  |  |  |             '%s/%s/restapi/media/%s.json' % (apihost, version_name, oid), | 
					
						
							|  |  |  |             video_id, note='Downloading media information') | 
					
						
							|  |  |  |         uuid = media_json['uuid'] | 
					
						
							|  |  |  |         is_wide = media_json['is_wide'] | 
					
						
							| 
									
										
										
										
											2014-05-30 16:35:17 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-07 15:33:45 +02:00
										 |  |  |         server_json = self._download_json( | 
					
						
							| 
									
										
										
										
											2015-05-30 13:23:09 +08:00
										 |  |  |             'http://spiegeltv-prod-static.s3.amazonaws.com/projectConfigs/projectConfig.json', | 
					
						
							|  |  |  |             video_id, note='Downloading server information') | 
					
						
							| 
									
										
										
										
											2015-06-09 20:36:08 +06:00
										 |  |  | 
 | 
					
						
							|  |  |  |         format = '16x9' if is_wide else '4x3' | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         formats = [] | 
					
						
							|  |  |  |         for streamingserver in server_json['streamingserver']: | 
					
						
							|  |  |  |             endpoint = streamingserver.get('endpoint') | 
					
						
							|  |  |  |             if not endpoint: | 
					
						
							|  |  |  |                 continue | 
					
						
							|  |  |  |             play_path = 'mp4:%s_spiegeltv_0500_%s.m4v' % (uuid, format) | 
					
						
							|  |  |  |             if endpoint.startswith('rtmp'): | 
					
						
							|  |  |  |                 formats.append({ | 
					
						
							|  |  |  |                     'url': endpoint, | 
					
						
							|  |  |  |                     'format_id': 'rtmp', | 
					
						
							|  |  |  |                     'app': compat_urllib_parse_urlparse(endpoint).path[1:], | 
					
						
							|  |  |  |                     'play_path': play_path, | 
					
						
							|  |  |  |                     'player_path': 'http://prod-static.spiegel.tv/frontend-076.swf', | 
					
						
							|  |  |  |                     'ext': 'flv', | 
					
						
							|  |  |  |                     'rtmp_live': True, | 
					
						
							|  |  |  |                 }) | 
					
						
							|  |  |  |             elif determine_ext(endpoint) == 'm3u8': | 
					
						
							| 
									
										
										
										
											2015-10-24 16:24:08 +06:00
										 |  |  |                 formats.append({ | 
					
						
							|  |  |  |                     'url': endpoint.replace('[video]', play_path), | 
					
						
							|  |  |  |                     'ext': 'm4v', | 
					
						
							|  |  |  |                     'format_id': 'hls',  # Prefer hls since it allows to workaround georestriction | 
					
						
							|  |  |  |                     'protocol': 'm3u8', | 
					
						
							|  |  |  |                     'preference': 1, | 
					
						
							|  |  |  |                     'http_headers': { | 
					
						
							| 
									
										
										
										
											2015-10-24 12:41:41 +02:00
										 |  |  |                         'Accept-Encoding': 'deflate',  # gzip causes trouble on the server side | 
					
						
							| 
									
										
										
										
											2015-10-24 16:24:08 +06:00
										 |  |  |                     }, | 
					
						
							|  |  |  |                 }) | 
					
						
							| 
									
										
										
										
											2015-06-09 20:36:08 +06:00
										 |  |  |             else: | 
					
						
							|  |  |  |                 formats.append({ | 
					
						
							|  |  |  |                     'url': endpoint, | 
					
						
							|  |  |  |                 }) | 
					
						
							| 
									
										
										
										
											2015-10-24 16:25:44 +06:00
										 |  |  |         self._check_formats(formats, video_id) | 
					
						
							| 
									
										
										
										
											2014-05-30 16:35:17 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |         thumbnails = [] | 
					
						
							|  |  |  |         for image in media_json['images']: | 
					
						
							| 
									
										
										
										
											2014-06-07 15:33:45 +02:00
										 |  |  |             thumbnails.append({ | 
					
						
							|  |  |  |                 'url': image['url'], | 
					
						
							|  |  |  |                 'width': image['width'], | 
					
						
							|  |  |  |                 'height': image['height'], | 
					
						
							|  |  |  |             }) | 
					
						
							| 
									
										
										
										
											2014-05-30 16:35:17 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |         description = media_json['subtitle'] | 
					
						
							| 
									
										
										
										
											2014-11-16 00:33:51 +01:00
										 |  |  |         duration = float_or_none(media_json.get('duration_in_ms'), scale=1000) | 
					
						
							| 
									
										
										
										
											2014-05-30 16:35:17 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-07 15:33:45 +02:00
										 |  |  |         return { | 
					
						
							| 
									
										
										
										
											2014-05-30 16:35:17 +02:00
										 |  |  |             'id': video_id, | 
					
						
							|  |  |  |             'title': title, | 
					
						
							|  |  |  |             'description': description, | 
					
						
							|  |  |  |             'duration': duration, | 
					
						
							| 
									
										
										
										
											2015-05-30 13:23:09 +08:00
										 |  |  |             'thumbnails': thumbnails, | 
					
						
							| 
									
										
										
										
											2015-06-09 20:36:08 +06:00
										 |  |  |             'formats': formats, | 
					
						
							| 
									
										
										
										
											2014-11-23 20:41:03 +01:00
										 |  |  |         } |