| 
									
										
										
										
											2014-04-19 19:42:51 +02:00
										 |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-10-28 17:35:01 +01:00
										 |  |  | import re | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | from .common import InfoExtractor | 
					
						
							|  |  |  | from ..utils import ( | 
					
						
							|  |  |  |     compat_urllib_parse_urlparse, | 
					
						
							|  |  |  |     compat_urllib_request, | 
					
						
							|  |  |  |     compat_urllib_parse, | 
					
						
							|  |  |  | ) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-19 19:42:51 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-10-28 17:35:01 +01:00
										 |  |  | class ExtremeTubeIE(InfoExtractor): | 
					
						
							| 
									
										
										
										
											2014-04-19 00:29:42 +02:00
										 |  |  |     _VALID_URL = r'^(?:https?://)?(?:www\.)?(?P<url>extremetube\.com/.*?video/.+?(?P<videoid>[0-9]+))(?:[/?&]|$)' | 
					
						
							| 
									
										
										
										
											2014-04-19 19:41:06 +02:00
										 |  |  |     _TESTS = [{ | 
					
						
							| 
									
										
										
										
											2014-04-19 19:42:51 +02:00
										 |  |  |         'url': 'http://www.extremetube.com/video/music-video-14-british-euro-brit-european-cumshots-swallow-652431', | 
					
						
							|  |  |  |         'md5': '1fb9228f5e3332ec8c057d6ac36f33e0', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '652431', | 
					
						
							|  |  |  |             'ext': 'mp4', | 
					
						
							|  |  |  |             'title': 'Music Video 14 british euro brit european cumshots swallow', | 
					
						
							|  |  |  |             'uploader': 'unknown', | 
					
						
							|  |  |  |             'age_limit': 18, | 
					
						
							| 
									
										
										
										
											2013-10-28 17:35:01 +01:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2014-04-19 19:41:06 +02:00
										 |  |  |     }, { | 
					
						
							|  |  |  |         'url': 'http://www.extremetube.com/gay/video/abcde-1234', | 
					
						
							|  |  |  |         'only_matching': True, | 
					
						
							|  |  |  |     }] | 
					
						
							| 
									
										
										
										
											2013-10-28 17:35:01 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def _real_extract(self, url): | 
					
						
							|  |  |  |         mobj = re.match(self._VALID_URL, url) | 
					
						
							|  |  |  |         video_id = mobj.group('videoid') | 
					
						
							|  |  |  |         url = 'http://www.' + mobj.group('url') | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         req = compat_urllib_request.Request(url) | 
					
						
							|  |  |  |         req.add_header('Cookie', 'age_verified=1') | 
					
						
							|  |  |  |         webpage = self._download_webpage(req, video_id) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-19 19:42:51 +02:00
										 |  |  |         video_title = self._html_search_regex( | 
					
						
							| 
									
										
										
										
											2014-05-31 18:31:39 +02:00
										 |  |  |             r'<h1 [^>]*?title="([^"]+)"[^>]*>', webpage, 'title') | 
					
						
							| 
									
										
										
										
											2014-04-19 19:42:51 +02:00
										 |  |  |         uploader = self._html_search_regex( | 
					
						
							|  |  |  |             r'>Posted by:(?=<)(?:\s|<[^>]*>)*(.+?)\|', webpage, 'uploader', | 
					
						
							|  |  |  |             fatal=False) | 
					
						
							|  |  |  |         video_url = compat_urllib_parse.unquote(self._html_search_regex( | 
					
						
							|  |  |  |             r'video_url=(.+?)&', webpage, 'video_url')) | 
					
						
							| 
									
										
										
										
											2013-11-03 14:03:17 +01:00
										 |  |  |         path = compat_urllib_parse_urlparse(video_url).path | 
					
						
							| 
									
										
										
										
											2013-10-28 17:35:01 +01:00
										 |  |  |         format = path.split('/')[5].split('_')[:2] | 
					
						
							| 
									
										
										
										
											2013-11-03 14:03:17 +01:00
										 |  |  |         format = "-".join(format) | 
					
						
							| 
									
										
										
										
											2013-10-28 17:35:01 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  |         return { | 
					
						
							|  |  |  |             'id': video_id, | 
					
						
							|  |  |  |             'title': video_title, | 
					
						
							|  |  |  |             'uploader': uploader, | 
					
						
							|  |  |  |             'url': video_url, | 
					
						
							|  |  |  |             'format': format, | 
					
						
							|  |  |  |             'format_id': format, | 
					
						
							| 
									
										
										
										
											2013-11-02 22:33:49 +01:00
										 |  |  |             'age_limit': 18, | 
					
						
							| 
									
										
										
										
											2013-10-28 17:35:01 +01:00
										 |  |  |         } |