| 
									
										
										
										
											2014-02-04 23:02:53 +01:00
										 |  |  | # encoding: utf-8 | 
					
						
							|  |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-06-23 22:25:46 +02:00
										 |  |  | from .common import InfoExtractor | 
					
						
							| 
									
										
										
										
											2014-12-13 12:24:42 +01:00
										 |  |  | from ..compat import ( | 
					
						
							| 
									
										
										
										
											2013-06-23 22:25:46 +02:00
										 |  |  |     compat_urllib_parse, | 
					
						
							| 
									
										
										
										
											2015-06-15 18:49:27 +08:00
										 |  |  |     compat_urlparse, | 
					
						
							| 
									
										
										
										
											2014-12-13 12:24:42 +01:00
										 |  |  | ) | 
					
						
							|  |  |  | from ..utils import ( | 
					
						
							| 
									
										
										
										
											2013-06-23 22:25:46 +02:00
										 |  |  |     ExtractorError, | 
					
						
							| 
									
										
										
										
											2015-11-21 22:18:17 +06:00
										 |  |  |     sanitized_Request, | 
					
						
							| 
									
										
										
										
											2013-06-23 22:25:46 +02:00
										 |  |  | ) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class Vbox7IE(InfoExtractor): | 
					
						
							| 
									
										
										
										
											2014-12-13 12:24:42 +01:00
										 |  |  |     _VALID_URL = r'http://(?:www\.)?vbox7\.com/play:(?P<id>[^/]+)' | 
					
						
							| 
									
										
										
										
											2013-06-27 20:46:46 +02:00
										 |  |  |     _TEST = { | 
					
						
							| 
									
										
										
										
											2014-02-04 23:02:53 +01:00
										 |  |  |         'url': 'http://vbox7.com/play:249bb972c2', | 
					
						
							|  |  |  |         'md5': '99f65c0c9ef9b682b97313e052734c3f', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '249bb972c2', | 
					
						
							| 
									
										
										
										
											2014-09-27 10:53:02 +02:00
										 |  |  |             'ext': 'mp4', | 
					
						
							| 
									
										
										
										
											2014-02-04 23:02:53 +01:00
										 |  |  |             'title': 'Смях! Чудо - чист за секунди - Скрита камера', | 
					
						
							|  |  |  |         }, | 
					
						
							| 
									
										
										
										
											2013-06-27 20:46:46 +02:00
										 |  |  |     } | 
					
						
							| 
									
										
										
										
											2013-06-23 22:25:46 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-02-04 23:02:53 +01:00
										 |  |  |     def _real_extract(self, url): | 
					
						
							| 
									
										
										
										
											2014-12-13 12:24:42 +01:00
										 |  |  |         video_id = self._match_id(url) | 
					
						
							| 
									
										
										
										
											2013-06-23 22:25:46 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-06-15 18:49:27 +08:00
										 |  |  |         # need to get the page 3 times for the correct jsSecretToken cookie | 
					
						
							|  |  |  |         # which is necessary for the correct title | 
					
						
							|  |  |  |         def get_session_id(): | 
					
						
							|  |  |  |             redirect_page = self._download_webpage(url, video_id) | 
					
						
							|  |  |  |             session_id_url = self._search_regex( | 
					
						
							|  |  |  |                 r'var\s*url\s*=\s*\'([^\']+)\';', redirect_page, | 
					
						
							|  |  |  |                 'session id url') | 
					
						
							|  |  |  |             self._download_webpage( | 
					
						
							|  |  |  |                 compat_urlparse.urljoin(url, session_id_url), video_id, | 
					
						
							|  |  |  |                 'Getting session id') | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         get_session_id() | 
					
						
							|  |  |  |         get_session_id() | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         webpage = self._download_webpage(url, video_id, | 
					
						
							| 
									
										
										
										
											2014-11-23 21:39:15 +01:00
										 |  |  |                                          'Downloading redirect page') | 
					
						
							| 
									
										
										
										
											2013-06-23 22:25:46 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |         title = self._html_search_regex(r'<title>(.*)</title>', | 
					
						
							| 
									
										
										
										
											2014-11-23 21:39:15 +01:00
										 |  |  |                                         webpage, 'title').split('/')[0].strip() | 
					
						
							| 
									
										
										
										
											2013-06-23 22:25:46 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |         info_url = "http://vbox7.com/play/magare.do" | 
					
						
							| 
									
										
										
										
											2014-02-04 23:02:53 +01:00
										 |  |  |         data = compat_urllib_parse.urlencode({'as3': '1', 'vid': video_id}) | 
					
						
							| 
									
										
										
										
											2015-11-21 22:18:17 +06:00
										 |  |  |         info_request = sanitized_Request(info_url, data) | 
					
						
							| 
									
										
										
										
											2013-06-23 22:25:46 +02:00
										 |  |  |         info_request.add_header('Content-Type', 'application/x-www-form-urlencoded') | 
					
						
							| 
									
										
										
										
											2014-02-04 23:02:53 +01:00
										 |  |  |         info_response = self._download_webpage(info_request, video_id, 'Downloading info webpage') | 
					
						
							| 
									
										
										
										
											2013-06-23 22:25:46 +02:00
										 |  |  |         if info_response is None: | 
					
						
							| 
									
										
										
										
											2014-02-04 23:02:53 +01:00
										 |  |  |             raise ExtractorError('Unable to extract the media url') | 
					
						
							| 
									
										
										
										
											2013-06-23 22:25:46 +02:00
										 |  |  |         (final_url, thumbnail_url) = map(lambda x: x.split('=')[1], info_response.split('&')) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-02-04 23:02:53 +01:00
										 |  |  |         return { | 
					
						
							|  |  |  |             'id': video_id, | 
					
						
							|  |  |  |             'url': final_url, | 
					
						
							|  |  |  |             'title': title, | 
					
						
							| 
									
										
										
										
											2013-06-23 22:25:46 +02:00
										 |  |  |             'thumbnail': thumbnail_url, | 
					
						
							| 
									
										
										
										
											2014-02-04 23:02:53 +01:00
										 |  |  |         } |