| 
									
										
										
										
											2016-09-30 20:06:08 +02:00
										 |  |  | # coding: utf-8 | 
					
						
							| 
									
										
										
										
											2014-07-11 13:21:32 +02:00
										 |  |  | from __future__ import unicode_literals | 
					
						
							| 
									
										
										
										
											2013-07-13 09:17:48 +05:00
										 |  |  | 
 | 
					
						
							|  |  |  | from .common import InfoExtractor | 
					
						
							| 
									
										
										
										
											2014-07-11 13:21:32 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-07-13 09:17:48 +05:00
										 |  |  | 
 | 
					
						
							|  |  |  | class CriterionIE(InfoExtractor): | 
					
						
							| 
									
										
										
										
											2016-09-08 18:29:05 +07:00
										 |  |  |     _VALID_URL = r'https?://(?:www\.)?criterion\.com/films/(?P<id>[0-9]+)-.+' | 
					
						
							| 
									
										
										
										
											2013-07-13 09:18:03 +05:00
										 |  |  |     _TEST = { | 
					
						
							| 
									
										
										
										
											2014-07-11 13:21:32 +02:00
										 |  |  |         'url': 'http://www.criterion.com/films/184-le-samourai', | 
					
						
							|  |  |  |         'md5': 'bc51beba55685509883a9a7830919ec3', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '184', | 
					
						
							|  |  |  |             'ext': 'mp4', | 
					
						
							|  |  |  |             'title': 'Le Samouraï', | 
					
						
							|  |  |  |             'description': 'md5:a2b4b116326558149bef81f76dcbb93f', | 
					
						
							| 
									
										
										
										
											2017-01-02 20:08:07 +08:00
										 |  |  |             'thumbnail': r're:^https?://.*\.jpg$', | 
					
						
							| 
									
										
										
										
											2013-07-13 09:18:03 +05:00
										 |  |  |         } | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2013-07-13 09:17:48 +05:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def _real_extract(self, url): | 
					
						
							| 
									
										
										
										
											2016-09-30 20:06:08 +02:00
										 |  |  |         video_id = self._match_id(url) | 
					
						
							| 
									
										
										
										
											2013-07-13 09:17:48 +05:00
										 |  |  |         webpage = self._download_webpage(url, video_id) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-07-11 13:21:32 +02:00
										 |  |  |         final_url = self._search_regex( | 
					
						
							| 
									
										
										
										
											2016-09-30 20:06:08 +02:00
										 |  |  |             r'so\.addVariable\("videoURL", "(.+?)"\)\;', webpage, 'video url') | 
					
						
							| 
									
										
										
										
											2014-07-11 13:21:32 +02:00
										 |  |  |         title = self._og_search_title(webpage) | 
					
						
							| 
									
										
										
										
											2015-10-14 14:13:53 +01:00
										 |  |  |         description = self._html_search_meta('description', webpage) | 
					
						
							| 
									
										
										
										
											2014-07-11 13:21:32 +02:00
										 |  |  |         thumbnail = self._search_regex( | 
					
						
							| 
									
										
										
										
											2016-09-30 20:06:08 +02:00
										 |  |  |             r'so\.addVariable\("thumbnailURL", "(.+?)"\)\;', | 
					
						
							| 
									
										
										
										
											2014-07-11 13:21:32 +02:00
										 |  |  |             webpage, 'thumbnail url') | 
					
						
							| 
									
										
										
										
											2013-07-13 09:17:48 +05:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-07-11 13:21:32 +02:00
										 |  |  |         return { | 
					
						
							|  |  |  |             'id': video_id, | 
					
						
							|  |  |  |             'url': final_url, | 
					
						
							|  |  |  |             'title': title, | 
					
						
							|  |  |  |             'description': description, | 
					
						
							|  |  |  |             'thumbnail': thumbnail, | 
					
						
							|  |  |  |         } |