| 
									
										
										
										
											2014-10-09 21:05:39 +07:00
										 |  |  |  | # coding: utf-8 | 
					
						
							|  |  |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | import re | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | from .common import InfoExtractor | 
					
						
							| 
									
										
										
										
											2017-02-05 13:36:52 +07:00
										 |  |  |  | from ..utils import js_to_json | 
					
						
							| 
									
										
										
										
											2014-10-09 21:05:39 +07:00
										 |  |  |  | 
 | 
					
						
							|  |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  | class SportBoxEmbedIE(InfoExtractor): | 
					
						
							|  |  |  |  |     _VALID_URL = r'https?://news\.sportbox\.ru/vdl/player(?:/[^/]+/|\?.*?\bn?id=)(?P<id>\d+)' | 
					
						
							|  |  |  |  |     _TESTS = [{ | 
					
						
							|  |  |  |  |         'url': 'http://news.sportbox.ru/vdl/player/ci/211355', | 
					
						
							|  |  |  |  |         'info_dict': { | 
					
						
							|  |  |  |  |             'id': '211355', | 
					
						
							|  |  |  |  |             'ext': 'mp4', | 
					
						
							|  |  |  |  |             'title': 'В Новороссийске прошел детский турнир «Поле славы боевой»', | 
					
						
							| 
									
										
										
										
											2017-01-02 20:08:07 +08:00
										 |  |  |  |             'thumbnail': r're:^https?://.*\.jpg$', | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  |         }, | 
					
						
							|  |  |  |  |         'params': { | 
					
						
							|  |  |  |  |             # m3u8 download | 
					
						
							|  |  |  |  |             'skip_download': True, | 
					
						
							|  |  |  |  |         }, | 
					
						
							|  |  |  |  |     }, { | 
					
						
							|  |  |  |  |         'url': 'http://news.sportbox.ru/vdl/player?nid=370908&only_player=1&autostart=false&playeri=2&height=340&width=580', | 
					
						
							|  |  |  |  |         'only_matching': True, | 
					
						
							|  |  |  |  |     }] | 
					
						
							|  |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-05-15 23:08:44 +06:00
										 |  |  |  |     @staticmethod | 
					
						
							|  |  |  |  |     def _extract_urls(webpage): | 
					
						
							|  |  |  |  |         return re.findall( | 
					
						
							|  |  |  |  |             r'<iframe[^>]+src="(https?://news\.sportbox\.ru/vdl/player[^"]+)"', | 
					
						
							|  |  |  |  |             webpage) | 
					
						
							|  |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  |     def _real_extract(self, url): | 
					
						
							|  |  |  |  |         video_id = self._match_id(url) | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |         webpage = self._download_webpage(url, video_id) | 
					
						
							|  |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-04-16 16:13:14 +08:00
										 |  |  |  |         formats = [] | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-04-16 16:13:14 +08:00
										 |  |  |  |         def cleanup_js(code): | 
					
						
							|  |  |  |  |             # desktop_advert_config contains complex Javascripts and we don't need it | 
					
						
							|  |  |  |  |             return js_to_json(re.sub(r'desktop_advert_config.*', '', code)) | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |         jwplayer_data = self._parse_json(self._search_regex( | 
					
						
							|  |  |  |  |             r'(?s)player\.setup\(({.+?})\);', webpage, 'jwplayer settings'), video_id, | 
					
						
							|  |  |  |  |             transform_source=cleanup_js) | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |         hls_url = jwplayer_data.get('hls_url') | 
					
						
							|  |  |  |  |         if hls_url: | 
					
						
							|  |  |  |  |             formats.extend(self._extract_m3u8_formats( | 
					
						
							|  |  |  |  |                 hls_url, video_id, ext='mp4', m3u8_id='hls')) | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-04-16 16:13:14 +08:00
										 |  |  |  |         rtsp_url = jwplayer_data.get('rtsp_url') | 
					
						
							|  |  |  |  |         if rtsp_url: | 
					
						
							|  |  |  |  |             formats.append({ | 
					
						
							|  |  |  |  |                 'url': rtsp_url, | 
					
						
							|  |  |  |  |                 'format_id': 'rtsp', | 
					
						
							|  |  |  |  |             }) | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |         self._sort_formats(formats) | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-04-16 16:13:14 +08:00
										 |  |  |  |         title = jwplayer_data['node_title'] | 
					
						
							|  |  |  |  |         thumbnail = jwplayer_data.get('image_url') | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  | 
 | 
					
						
							|  |  |  |  |         return { | 
					
						
							|  |  |  |  |             'id': video_id, | 
					
						
							|  |  |  |  |             'title': title, | 
					
						
							|  |  |  |  |             'thumbnail': thumbnail, | 
					
						
							| 
									
										
										
										
											2014-10-09 21:05:39 +07:00
										 |  |  |  |             'formats': formats, | 
					
						
							|  |  |  |  |         } |