| 
									
										
										
										
											2014-10-09 21:05:39 +07:00
										 |  |  |  | # coding: utf-8 | 
					
						
							|  |  |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | import re | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | from .common import InfoExtractor | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  | from ..compat import compat_urlparse | 
					
						
							| 
									
										
										
										
											2014-10-09 21:05:39 +07:00
										 |  |  |  | from ..utils import ( | 
					
						
							| 
									
										
										
										
											2016-04-16 16:13:14 +08:00
										 |  |  |  |     js_to_json, | 
					
						
							| 
									
										
										
										
											2015-05-22 00:45:33 +06:00
										 |  |  |  |     unified_strdate, | 
					
						
							| 
									
										
										
										
											2014-10-09 21:05:39 +07:00
										 |  |  |  | ) | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | class SportBoxIE(InfoExtractor): | 
					
						
							| 
									
										
										
										
											2015-05-15 16:52:11 +04:00
										 |  |  |  |     _VALID_URL = r'https?://news\.sportbox\.ru/(?:[^/]+/)+spbvideo_NI\d+_(?P<display_id>.+)' | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  |     _TESTS = [{ | 
					
						
							|  |  |  |  |         'url': 'http://news.sportbox.ru/Vidy_sporta/Avtosport/Rossijskij/spbvideo_NI483529_Gonka-2-zaezd-Obyedinenniy-2000-klassi-Turing-i-S', | 
					
						
							|  |  |  |  |         'md5': 'ff56a598c2cf411a9a38a69709e97079', | 
					
						
							|  |  |  |  |         'info_dict': { | 
					
						
							|  |  |  |  |             'id': '80822', | 
					
						
							|  |  |  |  |             'ext': 'mp4', | 
					
						
							|  |  |  |  |             'title': 'Гонка 2  заезд ««Объединенный 2000»: классы Туринг и Супер-продакшн', | 
					
						
							| 
									
										
										
										
											2015-05-22 00:45:33 +06:00
										 |  |  |  |             'description': 'md5:3d72dc4a006ab6805d82f037fdc637ad', | 
					
						
							| 
									
										
										
										
											2017-01-02 20:08:07 +08:00
										 |  |  |  |             'thumbnail': r're:^https?://.*\.jpg$', | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  |             'upload_date': '20140928', | 
					
						
							| 
									
										
										
										
											2015-05-15 19:57:54 +04:00
										 |  |  |  |         }, | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  |         'params': { | 
					
						
							|  |  |  |  |             # m3u8 download | 
					
						
							|  |  |  |  |             'skip_download': True, | 
					
						
							|  |  |  |  |         }, | 
					
						
							|  |  |  |  |     }, { | 
					
						
							|  |  |  |  |         'url': 'http://news.sportbox.ru/Vidy_sporta/billiard/spbvideo_NI486287_CHempionat-mira-po-dinamichnoy-piramide-4', | 
					
						
							|  |  |  |  |         'only_matching': True, | 
					
						
							|  |  |  |  |     }, { | 
					
						
							|  |  |  |  |         'url': 'http://news.sportbox.ru/video/no_ads/spbvideo_NI536574_V_Novorossijske_proshel_detskij_turnir_Pole_slavy_bojevoj?ci=211355', | 
					
						
							|  |  |  |  |         'only_matching': True, | 
					
						
							|  |  |  |  |     }] | 
					
						
							| 
									
										
										
										
											2014-10-09 21:05:39 +07:00
										 |  |  |  | 
 | 
					
						
							|  |  |  |  |     def _real_extract(self, url): | 
					
						
							|  |  |  |  |         mobj = re.match(self._VALID_URL, url) | 
					
						
							|  |  |  |  |         display_id = mobj.group('display_id') | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |         webpage = self._download_webpage(url, display_id) | 
					
						
							|  |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  |         player = self._search_regex( | 
					
						
							|  |  |  |  |             r'src="/?(vdl/player/[^"]+)"', webpage, 'player') | 
					
						
							| 
									
										
										
										
											2014-10-09 21:05:39 +07:00
										 |  |  |  | 
 | 
					
						
							|  |  |  |  |         title = self._html_search_regex( | 
					
						
							| 
									
										
										
										
											2015-05-22 00:45:33 +06:00
										 |  |  |  |             [r'"nodetitle"\s*:\s*"([^"]+)"', r'class="node-header_{1,2}title">([^<]+)'], | 
					
						
							|  |  |  |  |             webpage, 'title') | 
					
						
							|  |  |  |  |         description = self._og_search_description(webpage) or self._html_search_meta( | 
					
						
							|  |  |  |  |             'description', webpage, 'description') | 
					
						
							| 
									
										
										
										
											2014-10-09 21:05:39 +07:00
										 |  |  |  |         thumbnail = self._og_search_thumbnail(webpage) | 
					
						
							| 
									
										
										
										
											2015-05-22 00:45:33 +06:00
										 |  |  |  |         upload_date = unified_strdate(self._html_search_meta( | 
					
						
							|  |  |  |  |             'dateCreated', webpage, 'upload date')) | 
					
						
							| 
									
										
										
										
											2014-10-09 21:05:39 +07:00
										 |  |  |  | 
 | 
					
						
							|  |  |  |  |         return { | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  |             '_type': 'url_transparent', | 
					
						
							|  |  |  |  |             'url': compat_urlparse.urljoin(url, '/%s' % player), | 
					
						
							| 
									
										
										
										
											2014-10-09 21:05:39 +07:00
										 |  |  |  |             'display_id': display_id, | 
					
						
							|  |  |  |  |             'title': title, | 
					
						
							|  |  |  |  |             'description': description, | 
					
						
							|  |  |  |  |             'thumbnail': thumbnail, | 
					
						
							| 
									
										
										
										
											2015-05-22 00:45:33 +06:00
										 |  |  |  |             'upload_date': upload_date, | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  |         } | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | class SportBoxEmbedIE(InfoExtractor): | 
					
						
							|  |  |  |  |     _VALID_URL = r'https?://news\.sportbox\.ru/vdl/player(?:/[^/]+/|\?.*?\bn?id=)(?P<id>\d+)' | 
					
						
							|  |  |  |  |     _TESTS = [{ | 
					
						
							|  |  |  |  |         'url': 'http://news.sportbox.ru/vdl/player/ci/211355', | 
					
						
							|  |  |  |  |         'info_dict': { | 
					
						
							|  |  |  |  |             'id': '211355', | 
					
						
							|  |  |  |  |             'ext': 'mp4', | 
					
						
							|  |  |  |  |             'title': 'В Новороссийске прошел детский турнир «Поле славы боевой»', | 
					
						
							| 
									
										
										
										
											2017-01-02 20:08:07 +08:00
										 |  |  |  |             'thumbnail': r're:^https?://.*\.jpg$', | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  |         }, | 
					
						
							|  |  |  |  |         'params': { | 
					
						
							|  |  |  |  |             # m3u8 download | 
					
						
							|  |  |  |  |             'skip_download': True, | 
					
						
							|  |  |  |  |         }, | 
					
						
							|  |  |  |  |     }, { | 
					
						
							|  |  |  |  |         'url': 'http://news.sportbox.ru/vdl/player?nid=370908&only_player=1&autostart=false&playeri=2&height=340&width=580', | 
					
						
							|  |  |  |  |         'only_matching': True, | 
					
						
							|  |  |  |  |     }] | 
					
						
							|  |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-05-15 23:08:44 +06:00
										 |  |  |  |     @staticmethod | 
					
						
							|  |  |  |  |     def _extract_urls(webpage): | 
					
						
							|  |  |  |  |         return re.findall( | 
					
						
							|  |  |  |  |             r'<iframe[^>]+src="(https?://news\.sportbox\.ru/vdl/player[^"]+)"', | 
					
						
							|  |  |  |  |             webpage) | 
					
						
							|  |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  |     def _real_extract(self, url): | 
					
						
							|  |  |  |  |         video_id = self._match_id(url) | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |         webpage = self._download_webpage(url, video_id) | 
					
						
							|  |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-04-16 16:13:14 +08:00
										 |  |  |  |         formats = [] | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-04-16 16:13:14 +08:00
										 |  |  |  |         def cleanup_js(code): | 
					
						
							|  |  |  |  |             # desktop_advert_config contains complex Javascripts and we don't need it | 
					
						
							|  |  |  |  |             return js_to_json(re.sub(r'desktop_advert_config.*', '', code)) | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |         jwplayer_data = self._parse_json(self._search_regex( | 
					
						
							|  |  |  |  |             r'(?s)player\.setup\(({.+?})\);', webpage, 'jwplayer settings'), video_id, | 
					
						
							|  |  |  |  |             transform_source=cleanup_js) | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |         hls_url = jwplayer_data.get('hls_url') | 
					
						
							|  |  |  |  |         if hls_url: | 
					
						
							|  |  |  |  |             formats.extend(self._extract_m3u8_formats( | 
					
						
							|  |  |  |  |                 hls_url, video_id, ext='mp4', m3u8_id='hls')) | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-04-16 16:13:14 +08:00
										 |  |  |  |         rtsp_url = jwplayer_data.get('rtsp_url') | 
					
						
							|  |  |  |  |         if rtsp_url: | 
					
						
							|  |  |  |  |             formats.append({ | 
					
						
							|  |  |  |  |                 'url': rtsp_url, | 
					
						
							|  |  |  |  |                 'format_id': 'rtsp', | 
					
						
							|  |  |  |  |             }) | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |         self._sort_formats(formats) | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-04-16 16:13:14 +08:00
										 |  |  |  |         title = jwplayer_data['node_title'] | 
					
						
							|  |  |  |  |         thumbnail = jwplayer_data.get('image_url') | 
					
						
							| 
									
										
										
										
											2015-05-15 22:50:44 +06:00
										 |  |  |  | 
 | 
					
						
							|  |  |  |  |         return { | 
					
						
							|  |  |  |  |             'id': video_id, | 
					
						
							|  |  |  |  |             'title': title, | 
					
						
							|  |  |  |  |             'thumbnail': thumbnail, | 
					
						
							| 
									
										
										
										
											2014-10-09 21:05:39 +07:00
										 |  |  |  |             'formats': formats, | 
					
						
							|  |  |  |  |         } |