| 
									
										
										
										
											2015-03-08 18:03:12 +06:00
										 |  |  | # coding: utf-8 | 
					
						
							|  |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-12-07 22:02:45 +06:00
										 |  |  | import re | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-08 18:03:12 +06:00
										 |  |  | from .common import InfoExtractor | 
					
						
							| 
									
										
										
										
											2018-02-02 03:07:30 +07:00
										 |  |  | from ..compat import compat_urlparse | 
					
						
							| 
									
										
										
										
											2015-03-08 18:03:12 +06:00
										 |  |  | from ..utils import ( | 
					
						
							| 
									
										
										
										
											2018-02-02 03:07:30 +07:00
										 |  |  |     determine_ext, | 
					
						
							| 
									
										
										
										
											2015-03-08 18:03:12 +06:00
										 |  |  |     ExtractorError, | 
					
						
							|  |  |  |     int_or_none, | 
					
						
							|  |  |  |     xpath_text, | 
					
						
							| 
									
										
										
										
											2015-03-08 18:09:47 +06:00
										 |  |  |     qualities, | 
					
						
							| 
									
										
										
										
											2015-03-08 18:03:12 +06:00
										 |  |  | ) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class PladformIE(InfoExtractor): | 
					
						
							|  |  |  |     _VALID_URL = r'''(?x)
 | 
					
						
							|  |  |  |                     https?:// | 
					
						
							|  |  |  |                         (?: | 
					
						
							|  |  |  |                             (?: | 
					
						
							|  |  |  |                                 out\.pladform\.ru/player| | 
					
						
							|  |  |  |                                 static\.pladform\.ru/player\.swf | 
					
						
							|  |  |  |                             ) | 
					
						
							|  |  |  |                             \?.*\bvideoid=| | 
					
						
							|  |  |  |                             video\.pladform\.ru/catalog/video/videoid/ | 
					
						
							|  |  |  |                         ) | 
					
						
							|  |  |  |                         (?P<id>\d+) | 
					
						
							|  |  |  |                     '''
 | 
					
						
							|  |  |  |     _TESTS = [{ | 
					
						
							| 
									
										
										
										
											2018-02-02 03:07:30 +07:00
										 |  |  |         'url': 'https://out.pladform.ru/player?pl=64471&videoid=3777899&vk_puid15=0&vk_puid34=0', | 
					
						
							|  |  |  |         'md5': '53362fac3a27352da20fa2803cc5cd6f', | 
					
						
							| 
									
										
										
										
											2015-03-08 18:03:12 +06:00
										 |  |  |         'info_dict': { | 
					
						
							| 
									
										
										
										
											2018-02-02 03:07:30 +07:00
										 |  |  |             'id': '3777899', | 
					
						
							| 
									
										
										
										
											2015-03-08 18:03:12 +06:00
										 |  |  |             'ext': 'mp4', | 
					
						
							| 
									
										
										
										
											2018-02-02 03:07:30 +07:00
										 |  |  |             'title': 'СТУДИЯ СОЮЗ • Шоу Студия Союз, 24 выпуск (01.02.2018) Нурлан Сабуров и Слава Комиссаренко', | 
					
						
							|  |  |  |             'description': 'md5:05140e8bf1b7e2d46e7ba140be57fd95', | 
					
						
							| 
									
										
										
										
											2017-01-02 20:08:07 +08:00
										 |  |  |             'thumbnail': r're:^https?://.*\.jpg$', | 
					
						
							| 
									
										
										
										
											2018-02-02 03:07:30 +07:00
										 |  |  |             'duration': 3190, | 
					
						
							| 
									
										
										
										
											2015-03-08 18:03:12 +06:00
										 |  |  |         }, | 
					
						
							|  |  |  |     }, { | 
					
						
							|  |  |  |         'url': 'http://static.pladform.ru/player.swf?pl=21469&videoid=100183293&vkcid=0', | 
					
						
							|  |  |  |         'only_matching': True, | 
					
						
							|  |  |  |     }, { | 
					
						
							|  |  |  |         'url': 'http://video.pladform.ru/catalog/video/videoid/100183293/vkcid/0', | 
					
						
							|  |  |  |         'only_matching': True, | 
					
						
							|  |  |  |     }] | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-12-07 22:02:45 +06:00
										 |  |  |     @staticmethod | 
					
						
							|  |  |  |     def _extract_url(webpage): | 
					
						
							|  |  |  |         mobj = re.search( | 
					
						
							| 
									
										
										
										
											2016-06-30 23:19:29 +07:00
										 |  |  |             r'<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//out\.pladform\.ru/player\?.+?)\1', webpage) | 
					
						
							| 
									
										
										
										
											2015-12-07 22:02:45 +06:00
										 |  |  |         if mobj: | 
					
						
							|  |  |  |             return mobj.group('url') | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-08 18:03:12 +06:00
										 |  |  |     def _real_extract(self, url): | 
					
						
							|  |  |  |         video_id = self._match_id(url) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-02-02 03:07:30 +07:00
										 |  |  |         qs = compat_urlparse.parse_qs(compat_urlparse.urlparse(url).query) | 
					
						
							|  |  |  |         pl = qs.get('pl', ['1'])[0] | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-08 18:03:12 +06:00
										 |  |  |         video = self._download_xml( | 
					
						
							| 
									
										
										
										
											2018-02-02 03:07:30 +07:00
										 |  |  |             'http://out.pladform.ru/getVideo', video_id, query={ | 
					
						
							|  |  |  |                 'pl': pl, | 
					
						
							|  |  |  |                 'videoid': video_id, | 
					
						
							|  |  |  |             }) | 
					
						
							| 
									
										
										
										
											2015-03-08 18:03:12 +06:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-02-02 03:07:30 +07:00
										 |  |  |         def fail(text): | 
					
						
							| 
									
										
										
										
											2015-03-08 18:03:12 +06:00
										 |  |  |             raise ExtractorError( | 
					
						
							| 
									
										
										
										
											2018-02-02 03:07:30 +07:00
										 |  |  |                 '%s returned error: %s' % (self.IE_NAME, text), | 
					
						
							| 
									
										
										
										
											2015-03-08 18:03:12 +06:00
										 |  |  |                 expected=True) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-02-02 03:07:30 +07:00
										 |  |  |         if video.tag == 'error': | 
					
						
							|  |  |  |             fail(video.text) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-08 18:09:47 +06:00
										 |  |  |         quality = qualities(('ld', 'sd', 'hd')) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-02-02 03:07:30 +07:00
										 |  |  |         formats = [] | 
					
						
							|  |  |  |         for src in video.findall('./src'): | 
					
						
							|  |  |  |             if src is None: | 
					
						
							|  |  |  |                 continue | 
					
						
							|  |  |  |             format_url = src.text | 
					
						
							|  |  |  |             if not format_url: | 
					
						
							|  |  |  |                 continue | 
					
						
							|  |  |  |             if src.get('type') == 'hls' or determine_ext(format_url) == 'm3u8': | 
					
						
							|  |  |  |                 formats.extend(self._extract_m3u8_formats( | 
					
						
							|  |  |  |                     format_url, video_id, 'mp4', entry_protocol='m3u8_native', | 
					
						
							|  |  |  |                     m3u8_id='hls', fatal=False)) | 
					
						
							|  |  |  |             else: | 
					
						
							|  |  |  |                 formats.append({ | 
					
						
							|  |  |  |                     'url': src.text, | 
					
						
							|  |  |  |                     'format_id': src.get('quality'), | 
					
						
							|  |  |  |                     'quality': quality(src.get('quality')), | 
					
						
							|  |  |  |                 }) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         if not formats: | 
					
						
							|  |  |  |             error = xpath_text(video, './cap', 'error', default=None) | 
					
						
							|  |  |  |             if error: | 
					
						
							|  |  |  |                 fail(error) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-08 18:03:12 +06:00
										 |  |  |         self._sort_formats(formats) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         webpage = self._download_webpage( | 
					
						
							|  |  |  |             'http://video.pladform.ru/catalog/video/videoid/%s' % video_id, | 
					
						
							|  |  |  |             video_id) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         title = self._og_search_title(webpage, fatal=False) or xpath_text( | 
					
						
							|  |  |  |             video, './/title', 'title', fatal=True) | 
					
						
							|  |  |  |         description = self._search_regex( | 
					
						
							|  |  |  |             r'</h3>\s*<p>([^<]+)</p>', webpage, 'description', fatal=False) | 
					
						
							|  |  |  |         thumbnail = self._og_search_thumbnail(webpage) or xpath_text( | 
					
						
							|  |  |  |             video, './/cover', 'cover') | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         duration = int_or_none(xpath_text(video, './/time', 'duration')) | 
					
						
							|  |  |  |         age_limit = int_or_none(xpath_text(video, './/age18', 'age limit')) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         return { | 
					
						
							|  |  |  |             'id': video_id, | 
					
						
							|  |  |  |             'title': title, | 
					
						
							|  |  |  |             'description': description, | 
					
						
							|  |  |  |             'thumbnail': thumbnail, | 
					
						
							|  |  |  |             'duration': duration, | 
					
						
							|  |  |  |             'age_limit': age_limit, | 
					
						
							|  |  |  |             'formats': formats, | 
					
						
							|  |  |  |         } |