| 
									
										
										
										
											2014-04-19 19:42:51 +02:00
										 |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-10-28 17:35:01 +01:00
										 |  |  | import re | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | from .common import InfoExtractor | 
					
						
							| 
									
										
										
										
											2014-12-13 12:24:42 +01:00
										 |  |  | from ..compat import ( | 
					
						
							| 
									
										
										
										
											2015-03-05 14:45:38 +02:00
										 |  |  |     compat_parse_qs, | 
					
						
							| 
									
										
										
										
											2013-10-28 17:35:01 +01:00
										 |  |  |     compat_urllib_request, | 
					
						
							| 
									
										
										
										
											2014-12-13 12:24:42 +01:00
										 |  |  | ) | 
					
						
							|  |  |  | from ..utils import ( | 
					
						
							| 
									
										
										
										
											2015-03-05 14:45:38 +02:00
										 |  |  |     qualities, | 
					
						
							| 
									
										
										
										
											2014-09-27 22:36:53 +07:00
										 |  |  |     str_to_int, | 
					
						
							| 
									
										
										
										
											2013-10-28 17:35:01 +01:00
										 |  |  | ) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-19 19:42:51 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-10-28 17:35:01 +01:00
										 |  |  | class ExtremeTubeIE(InfoExtractor): | 
					
						
							| 
									
										
										
										
											2014-12-13 12:24:42 +01:00
										 |  |  |     _VALID_URL = r'https?://(?:www\.)?(?P<url>extremetube\.com/.*?video/.+?(?P<id>[0-9]+))(?:[/?&]|$)' | 
					
						
							| 
									
										
										
										
											2014-04-19 19:41:06 +02:00
										 |  |  |     _TESTS = [{ | 
					
						
							| 
									
										
										
										
											2014-04-19 19:42:51 +02:00
										 |  |  |         'url': 'http://www.extremetube.com/video/music-video-14-british-euro-brit-european-cumshots-swallow-652431', | 
					
						
							| 
									
										
										
										
											2015-03-05 14:45:38 +02:00
										 |  |  |         'md5': '344d0c6d50e2f16b06e49ca011d8ac69', | 
					
						
							| 
									
										
										
										
											2014-04-19 19:42:51 +02:00
										 |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '652431', | 
					
						
							|  |  |  |             'ext': 'mp4', | 
					
						
							|  |  |  |             'title': 'Music Video 14 british euro brit european cumshots swallow', | 
					
						
							|  |  |  |             'uploader': 'unknown', | 
					
						
							| 
									
										
										
										
											2014-09-27 22:36:53 +07:00
										 |  |  |             'view_count': int, | 
					
						
							| 
									
										
										
										
											2014-04-19 19:42:51 +02:00
										 |  |  |             'age_limit': 18, | 
					
						
							| 
									
										
										
										
											2013-10-28 17:35:01 +01:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2014-04-19 19:41:06 +02:00
										 |  |  |     }, { | 
					
						
							|  |  |  |         'url': 'http://www.extremetube.com/gay/video/abcde-1234', | 
					
						
							|  |  |  |         'only_matching': True, | 
					
						
							|  |  |  |     }] | 
					
						
							| 
									
										
										
										
											2013-10-28 17:35:01 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def _real_extract(self, url): | 
					
						
							|  |  |  |         mobj = re.match(self._VALID_URL, url) | 
					
						
							| 
									
										
										
										
											2014-12-13 12:24:42 +01:00
										 |  |  |         video_id = mobj.group('id') | 
					
						
							| 
									
										
										
										
											2013-10-28 17:35:01 +01:00
										 |  |  |         url = 'http://www.' + mobj.group('url') | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         req = compat_urllib_request.Request(url) | 
					
						
							|  |  |  |         req.add_header('Cookie', 'age_verified=1') | 
					
						
							|  |  |  |         webpage = self._download_webpage(req, video_id) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-04-19 19:42:51 +02:00
										 |  |  |         video_title = self._html_search_regex( | 
					
						
							| 
									
										
										
										
											2014-05-31 18:31:39 +02:00
										 |  |  |             r'<h1 [^>]*?title="([^"]+)"[^>]*>', webpage, 'title') | 
					
						
							| 
									
										
										
										
											2014-04-19 19:42:51 +02:00
										 |  |  |         uploader = self._html_search_regex( | 
					
						
							| 
									
										
										
										
											2014-09-27 22:36:53 +07:00
										 |  |  |             r'Uploaded by:\s*</strong>\s*(.+?)\s*</div>', | 
					
						
							|  |  |  |             webpage, 'uploader', fatal=False) | 
					
						
							|  |  |  |         view_count = str_to_int(self._html_search_regex( | 
					
						
							|  |  |  |             r'Views:\s*</strong>\s*<span>([\d,\.]+)</span>', | 
					
						
							|  |  |  |             webpage, 'view count', fatal=False)) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-05 14:45:38 +02:00
										 |  |  |         flash_vars = compat_parse_qs(self._search_regex( | 
					
						
							|  |  |  |             r'<param[^>]+?name="flashvars"[^>]+?value="([^"]+)"', webpage, 'flash vars')) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         formats = [] | 
					
						
							|  |  |  |         quality = qualities(['180p', '240p', '360p', '480p', '720p', '1080p']) | 
					
						
							|  |  |  |         for k, vals in flash_vars.items(): | 
					
						
							|  |  |  |             m = re.match(r'quality_(?P<quality>[0-9]+p)$', k) | 
					
						
							|  |  |  |             if m is not None: | 
					
						
							|  |  |  |                 formats.append({ | 
					
						
							|  |  |  |                     'format_id': m.group('quality'), | 
					
						
							|  |  |  |                     'quality': quality(m.group('quality')), | 
					
						
							|  |  |  |                     'url': vals[0], | 
					
						
							|  |  |  |                 }) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         self._sort_formats(formats) | 
					
						
							| 
									
										
										
										
											2013-10-28 17:35:01 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  |         return { | 
					
						
							|  |  |  |             'id': video_id, | 
					
						
							|  |  |  |             'title': video_title, | 
					
						
							| 
									
										
										
										
											2015-03-05 14:45:38 +02:00
										 |  |  |             'formats': formats, | 
					
						
							| 
									
										
										
										
											2013-10-28 17:35:01 +01:00
										 |  |  |             'uploader': uploader, | 
					
						
							| 
									
										
										
										
											2014-09-27 22:36:53 +07:00
										 |  |  |             'view_count': view_count, | 
					
						
							| 
									
										
										
										
											2013-11-02 22:33:49 +01:00
										 |  |  |             'age_limit': 18, | 
					
						
							| 
									
										
										
										
											2013-10-28 17:35:01 +01:00
										 |  |  |         } |