| 
									
										
										
										
											2017-06-02 22:44:39 +02:00
										 |  |  | # coding: utf-8 | 
					
						
							|  |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | import re | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-07-09 19:05:18 +07:00
										 |  |  | from .common import InfoExtractor | 
					
						
							|  |  |  | from ..compat import compat_str | 
					
						
							|  |  |  | from ..utils import ( | 
					
						
							|  |  |  |     int_or_none, | 
					
						
							|  |  |  |     js_to_json, | 
					
						
							|  |  |  |     try_get, | 
					
						
							|  |  |  | ) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-06-02 22:44:39 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | class JojIE(InfoExtractor): | 
					
						
							| 
									
										
										
										
											2017-07-09 19:05:18 +07:00
										 |  |  |     _VALID_URL = r'''(?x)
 | 
					
						
							|  |  |  |                     (?: | 
					
						
							|  |  |  |                         joj:| | 
					
						
							|  |  |  |                         https?://media\.joj\.sk/embed/ | 
					
						
							|  |  |  |                     ) | 
					
						
							| 
									
										
										
										
											2018-06-24 23:57:22 +07:00
										 |  |  |                     (?P<id>[^/?#^]+) | 
					
						
							| 
									
										
										
										
											2017-07-09 19:05:18 +07:00
										 |  |  |                 '''
 | 
					
						
							| 
									
										
										
										
											2017-06-02 22:44:39 +02:00
										 |  |  |     _TESTS = [{ | 
					
						
							| 
									
										
										
										
											2017-07-09 19:05:18 +07:00
										 |  |  |         'url': 'https://media.joj.sk/embed/a388ec4c-6019-4a4a-9312-b1bee194e932', | 
					
						
							| 
									
										
										
										
											2017-06-02 22:44:39 +02:00
										 |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': 'a388ec4c-6019-4a4a-9312-b1bee194e932', | 
					
						
							|  |  |  |             'ext': 'mp4', | 
					
						
							| 
									
										
										
										
											2017-07-09 19:05:18 +07:00
										 |  |  |             'title': 'NOVÉ BÝVANIE', | 
					
						
							|  |  |  |             'thumbnail': r're:^https?://.*\.jpg$', | 
					
						
							|  |  |  |             'duration': 3118, | 
					
						
							| 
									
										
										
										
											2017-06-02 22:44:39 +02:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2018-06-24 23:57:22 +07:00
										 |  |  |     }, { | 
					
						
							|  |  |  |         'url': 'https://media.joj.sk/embed/9i1cxv', | 
					
						
							|  |  |  |         'only_matching': True, | 
					
						
							| 
									
										
										
										
											2017-06-02 22:44:39 +02:00
										 |  |  |     }, { | 
					
						
							| 
									
										
										
										
											2017-07-09 19:05:18 +07:00
										 |  |  |         'url': 'joj:a388ec4c-6019-4a4a-9312-b1bee194e932', | 
					
						
							|  |  |  |         'only_matching': True, | 
					
						
							| 
									
										
										
										
											2018-06-24 23:57:22 +07:00
										 |  |  |     }, { | 
					
						
							|  |  |  |         'url': 'joj:9i1cxv', | 
					
						
							|  |  |  |         'only_matching': True, | 
					
						
							| 
									
										
										
										
											2017-06-02 22:44:39 +02:00
										 |  |  |     }] | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-07-09 19:05:18 +07:00
										 |  |  |     @staticmethod | 
					
						
							|  |  |  |     def _extract_urls(webpage): | 
					
						
							| 
									
										
										
										
											2018-06-24 23:57:22 +07:00
										 |  |  |         return [ | 
					
						
							|  |  |  |             mobj.group('url') | 
					
						
							|  |  |  |             for mobj in re.finditer( | 
					
						
							|  |  |  |                 r'<iframe\b[^>]+\bsrc=(["\'])(?P<url>(?:https?:)?//media\.joj\.sk/embed/(?:(?!\1).)+)\1', | 
					
						
							|  |  |  |                 webpage)] | 
					
						
							| 
									
										
										
										
											2017-06-02 22:44:39 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def _real_extract(self, url): | 
					
						
							| 
									
										
										
										
											2017-07-09 19:05:18 +07:00
										 |  |  |         video_id = self._match_id(url) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         webpage = self._download_webpage( | 
					
						
							|  |  |  |             'https://media.joj.sk/embed/%s' % video_id, video_id) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         title = self._search_regex( | 
					
						
							|  |  |  |             (r'videoTitle\s*:\s*(["\'])(?P<title>(?:(?!\1).)+)\1', | 
					
						
							|  |  |  |              r'<title>(?P<title>[^<]+)'), webpage, 'title', | 
					
						
							|  |  |  |             default=None, group='title') or self._og_search_title(webpage) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         bitrates = self._parse_json( | 
					
						
							|  |  |  |             self._search_regex( | 
					
						
							| 
									
										
										
										
											2018-11-24 16:14:27 +01:00
										 |  |  |                 r'(?s)(?:src|bitrates)\s*=\s*({.+?});', webpage, 'bitrates', | 
					
						
							| 
									
										
										
										
											2017-07-09 19:05:18 +07:00
										 |  |  |                 default='{}'), | 
					
						
							|  |  |  |             video_id, transform_source=js_to_json, fatal=False) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-06-02 22:44:39 +02:00
										 |  |  |         formats = [] | 
					
						
							| 
									
										
										
										
											2017-07-09 19:05:18 +07:00
										 |  |  |         for format_url in try_get(bitrates, lambda x: x['mp4'], list) or []: | 
					
						
							|  |  |  |             if isinstance(format_url, compat_str): | 
					
						
							|  |  |  |                 height = self._search_regex( | 
					
						
							|  |  |  |                     r'(\d+)[pP]\.', format_url, 'height', default=None) | 
					
						
							|  |  |  |                 formats.append({ | 
					
						
							|  |  |  |                     'url': format_url, | 
					
						
							|  |  |  |                     'format_id': '%sp' % height if height else None, | 
					
						
							|  |  |  |                     'height': int(height), | 
					
						
							|  |  |  |                 }) | 
					
						
							|  |  |  |         if not formats: | 
					
						
							|  |  |  |             playlist = self._download_xml( | 
					
						
							|  |  |  |                 'https://media.joj.sk/services/Video.php?clip=%s' % video_id, | 
					
						
							|  |  |  |                 video_id) | 
					
						
							|  |  |  |             for file_el in playlist.findall('./files/file'): | 
					
						
							|  |  |  |                 path = file_el.get('path') | 
					
						
							|  |  |  |                 if not path: | 
					
						
							|  |  |  |                     continue | 
					
						
							|  |  |  |                 format_id = file_el.get('id') or file_el.get('label') | 
					
						
							|  |  |  |                 formats.append({ | 
					
						
							|  |  |  |                     'url': 'http://n16.joj.sk/storage/%s' % path.replace( | 
					
						
							|  |  |  |                         'dat/', '', 1), | 
					
						
							|  |  |  |                     'format_id': format_id, | 
					
						
							|  |  |  |                     'height': int_or_none(self._search_regex( | 
					
						
							|  |  |  |                         r'(\d+)[pP]', format_id or path, 'height', | 
					
						
							|  |  |  |                         default=None)), | 
					
						
							|  |  |  |                 }) | 
					
						
							| 
									
										
										
										
											2017-06-02 22:44:39 +02:00
										 |  |  |         self._sort_formats(formats) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-07-09 19:05:18 +07:00
										 |  |  |         thumbnail = self._og_search_thumbnail(webpage) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         duration = int_or_none(self._search_regex( | 
					
						
							|  |  |  |             r'videoDuration\s*:\s*(\d+)', webpage, 'duration', fatal=False)) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-06-02 22:44:39 +02:00
										 |  |  |         return { | 
					
						
							|  |  |  |             'id': video_id, | 
					
						
							| 
									
										
										
										
											2017-07-09 19:05:18 +07:00
										 |  |  |             'title': title, | 
					
						
							|  |  |  |             'thumbnail': thumbnail, | 
					
						
							|  |  |  |             'duration': duration, | 
					
						
							| 
									
										
										
										
											2017-06-02 22:44:39 +02:00
										 |  |  |             'formats': formats, | 
					
						
							|  |  |  |         } |