| 
									
										
										
										
											2014-03-10 14:41:19 +01:00
										 |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | import re | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | from .common import InfoExtractor | 
					
						
							|  |  |  | from ..utils import ( | 
					
						
							| 
									
										
										
										
											2014-11-29 22:16:35 +06:00
										 |  |  |     ExtractorError, | 
					
						
							|  |  |  |     clean_html, | 
					
						
							| 
									
										
										
										
											2014-03-10 14:41:19 +01:00
										 |  |  |     compat_urllib_parse, | 
					
						
							|  |  |  | ) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-03-10 20:55:47 +01:00
										 |  |  | class PlayvidIE(InfoExtractor): | 
					
						
							|  |  |  |     _VALID_URL = r'^https?://www\.playvid\.com/watch(\?v=|/)(?P<id>.+?)(?:#|$)' | 
					
						
							| 
									
										
										
										
											2014-03-10 14:41:19 +01:00
										 |  |  |     _TEST = { | 
					
						
							|  |  |  |         'url': 'http://www.playvid.com/watch/agbDDi7WZTV', | 
					
						
							|  |  |  |         'md5': '44930f8afa616efdf9482daf4fe53e1e', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							| 
									
										
										
										
											2014-03-10 20:55:47 +01:00
										 |  |  |             'id': 'agbDDi7WZTV', | 
					
						
							|  |  |  |             'ext': 'mp4', | 
					
						
							| 
									
										
										
										
											2014-03-10 14:41:19 +01:00
										 |  |  |             'title': 'Michelle Lewin in Miami Beach', | 
					
						
							|  |  |  |             'duration': 240, | 
					
						
							|  |  |  |             'age_limit': 18, | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _real_extract(self, url): | 
					
						
							|  |  |  |         mobj = re.match(self._VALID_URL, url) | 
					
						
							|  |  |  |         video_id = mobj.group('id') | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         webpage = self._download_webpage(url, video_id) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-11-29 22:16:35 +06:00
										 |  |  |         m_error = re.search( | 
					
						
							|  |  |  |             r'<div class="block-error">\s*<div class="heading">\s*<div>(?P<msg>.+?)</div>\s*</div>', webpage) | 
					
						
							|  |  |  |         if m_error: | 
					
						
							|  |  |  |             raise ExtractorError(clean_html(m_error.group('msg')), expected=True) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-03-10 14:41:19 +01:00
										 |  |  |         video_title = None | 
					
						
							|  |  |  |         duration = None | 
					
						
							|  |  |  |         video_thumbnail = None | 
					
						
							|  |  |  |         formats = [] | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         # most of the information is stored in the flashvars | 
					
						
							| 
									
										
										
										
											2014-03-10 20:55:47 +01:00
										 |  |  |         flashvars = self._html_search_regex( | 
					
						
							|  |  |  |             r'flashvars="(.+?)"', webpage, 'flashvars') | 
					
						
							| 
									
										
										
										
											2014-03-10 14:41:19 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-03-10 20:55:47 +01:00
										 |  |  |         infos = compat_urllib_parse.unquote(flashvars).split(r'&') | 
					
						
							|  |  |  |         for info in infos: | 
					
						
							|  |  |  |             videovars_match = re.match(r'^video_vars\[(.+?)\]=(.+?)$', info) | 
					
						
							|  |  |  |             if videovars_match: | 
					
						
							|  |  |  |                 key = videovars_match.group(1) | 
					
						
							|  |  |  |                 val = videovars_match.group(2) | 
					
						
							| 
									
										
										
										
											2014-03-10 14:41:19 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-03-10 20:55:47 +01:00
										 |  |  |                 if key == 'title': | 
					
						
							|  |  |  |                     video_title = compat_urllib_parse.unquote_plus(val) | 
					
						
							|  |  |  |                 if key == 'duration': | 
					
						
							|  |  |  |                     try: | 
					
						
							|  |  |  |                         duration = int(val) | 
					
						
							|  |  |  |                     except ValueError: | 
					
						
							|  |  |  |                         pass | 
					
						
							|  |  |  |                 if key == 'big_thumb': | 
					
						
							|  |  |  |                     video_thumbnail = val | 
					
						
							| 
									
										
										
										
											2014-03-10 14:41:19 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-03-10 20:55:47 +01:00
										 |  |  |                 videourl_match = re.match( | 
					
						
							|  |  |  |                     r'^video_urls\]\[(?P<resolution>[0-9]+)p', key) | 
					
						
							|  |  |  |                 if videourl_match: | 
					
						
							|  |  |  |                     height = int(videourl_match.group('resolution')) | 
					
						
							|  |  |  |                     formats.append({ | 
					
						
							|  |  |  |                         'height': height, | 
					
						
							|  |  |  |                         'url': val, | 
					
						
							|  |  |  |                     }) | 
					
						
							|  |  |  |         self._sort_formats(formats) | 
					
						
							| 
									
										
										
										
											2014-03-10 14:41:19 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  |         # Extract title - should be in the flashvars; if not, look elsewhere | 
					
						
							|  |  |  |         if video_title is None: | 
					
						
							|  |  |  |             video_title = self._html_search_regex( | 
					
						
							|  |  |  |                 r'<title>(.*?)</title', webpage, 'title') | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         return { | 
					
						
							|  |  |  |             'id': video_id, | 
					
						
							|  |  |  |             'formats': formats, | 
					
						
							|  |  |  |             'title': video_title, | 
					
						
							|  |  |  |             'thumbnail': video_thumbnail, | 
					
						
							|  |  |  |             'duration': duration, | 
					
						
							|  |  |  |             'description': None, | 
					
						
							|  |  |  |             'age_limit': 18 | 
					
						
							|  |  |  |         } |