| 
									
										
										
										
											2016-01-09 15:31:50 -08:00
										 |  |  | # coding: utf-8 | 
					
						
							|  |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-01-10 10:31:36 +06:00
										 |  |  | import base64 | 
					
						
							|  |  |  | import re | 
					
						
							| 
									
										
										
										
											2016-01-09 15:31:50 -08:00
										 |  |  | 
 | 
					
						
							|  |  |  | from .common import InfoExtractor | 
					
						
							|  |  |  | from ..compat import compat_urllib_parse_unquote | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class BigflixIE(InfoExtractor): | 
					
						
							| 
									
										
										
										
											2016-01-10 10:31:36 +06:00
										 |  |  |     _VALID_URL = r'https?://(?:www\.)?bigflix\.com/.+/(?P<id>[0-9]+)' | 
					
						
							|  |  |  |     _TESTS = [{ | 
					
						
							| 
									
										
										
										
											2016-01-09 15:31:50 -08:00
										 |  |  |         'url': 'http://www.bigflix.com/Hindi-movies/Action-movies/Singham-Returns/16537', | 
					
						
							|  |  |  |         'md5': 'ec76aa9b1129e2e5b301a474e54fab74', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '16537', | 
					
						
							|  |  |  |             'ext': 'mp4', | 
					
						
							|  |  |  |             'title': 'Singham Returns', | 
					
						
							|  |  |  |             'description': 'md5:3d2ba5815f14911d5cc6a501ae0cf65d', | 
					
						
							|  |  |  |         } | 
					
						
							| 
									
										
										
										
											2016-01-10 10:31:36 +06:00
										 |  |  |     }, { | 
					
						
							| 
									
										
										
										
											2016-01-10 10:49:27 +06:00
										 |  |  |         # 2 formats | 
					
						
							| 
									
										
										
										
											2016-01-10 10:31:36 +06:00
										 |  |  |         'url': 'http://www.bigflix.com/Tamil-movies/Drama-movies/Madarasapatinam/16070', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '16070', | 
					
						
							|  |  |  |             'ext': 'mp4', | 
					
						
							|  |  |  |             'title': 'Madarasapatinam', | 
					
						
							|  |  |  |             'description': 'md5:63b9b8ed79189c6f0418c26d9a3452ca', | 
					
						
							|  |  |  |             'formats': 'mincount:2', | 
					
						
							|  |  |  |         }, | 
					
						
							|  |  |  |         'params': { | 
					
						
							|  |  |  |             'skip_download': True, | 
					
						
							|  |  |  |         } | 
					
						
							| 
									
										
										
										
											2016-01-10 10:49:27 +06:00
										 |  |  |     }, { | 
					
						
							|  |  |  |         # multiple formats | 
					
						
							|  |  |  |         'url': 'http://www.bigflix.com/Malayalam-movies/Drama-movies/Indian-Rupee/15967', | 
					
						
							|  |  |  |         'only_matching': True, | 
					
						
							| 
									
										
										
										
											2016-01-10 10:31:36 +06:00
										 |  |  |     }] | 
					
						
							| 
									
										
										
										
											2016-01-09 15:31:50 -08:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def _real_extract(self, url): | 
					
						
							|  |  |  |         video_id = self._match_id(url) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         webpage = self._download_webpage(url, video_id) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         title = self._html_search_regex( | 
					
						
							|  |  |  |             r'<div[^>]+class=["\']pagetitle["\'][^>]*>(.+?)</div>', | 
					
						
							|  |  |  |             webpage, 'title') | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-01-10 10:31:36 +06:00
										 |  |  |         def decode_url(quoted_b64_url): | 
					
						
							|  |  |  |             return base64.b64decode(compat_urllib_parse_unquote( | 
					
						
							| 
									
										
										
										
											2016-01-10 10:49:27 +06:00
										 |  |  |                 quoted_b64_url).encode('ascii')).decode('utf-8') | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         formats = [] | 
					
						
							|  |  |  |         for height, encoded_url in re.findall( | 
					
						
							| 
									
										
										
										
											2016-01-10 14:26:27 +01:00
										 |  |  |                 r'ContentURL_(\d{3,4})[pP][^=]+=([^&]+)', webpage): | 
					
						
							| 
									
										
										
										
											2016-01-10 10:49:27 +06:00
										 |  |  |             video_url = decode_url(encoded_url) | 
					
						
							|  |  |  |             f = { | 
					
						
							|  |  |  |                 'url': video_url, | 
					
						
							|  |  |  |                 'format_id': '%sp' % height, | 
					
						
							|  |  |  |                 'height': int(height), | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  |             if video_url.startswith('rtmp'): | 
					
						
							|  |  |  |                 f['ext'] = 'flv' | 
					
						
							|  |  |  |             formats.append(f) | 
					
						
							| 
									
										
										
										
											2016-01-10 10:31:36 +06:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-01-10 10:49:27 +06:00
										 |  |  |         file_url = self._search_regex( | 
					
						
							|  |  |  |             r'file=([^&]+)', webpage, 'video url', default=None) | 
					
						
							|  |  |  |         if file_url: | 
					
						
							|  |  |  |             video_url = decode_url(file_url) | 
					
						
							|  |  |  |             if all(f['url'] != video_url for f in formats): | 
					
						
							|  |  |  |                 formats.append({ | 
					
						
							|  |  |  |                     'url': decode_url(file_url), | 
					
						
							|  |  |  |                 }) | 
					
						
							| 
									
										
										
										
											2016-01-10 10:31:36 +06:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-01-10 10:49:27 +06:00
										 |  |  |         self._sort_formats(formats) | 
					
						
							| 
									
										
										
										
											2016-01-09 15:31:50 -08:00
										 |  |  | 
 | 
					
						
							|  |  |  |         description = self._html_search_meta('description', webpage) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         return { | 
					
						
							|  |  |  |             'id': video_id, | 
					
						
							|  |  |  |             'title': title, | 
					
						
							|  |  |  |             'description': description, | 
					
						
							| 
									
										
										
										
											2016-01-10 10:31:36 +06:00
										 |  |  |             'formats': formats | 
					
						
							| 
									
										
										
										
											2016-01-09 15:31:50 -08:00
										 |  |  |         } |