| 
									
										
										
										
											2014-01-06 12:54:01 +01:00
										 |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-09-02 11:54:09 +02:00
										 |  |  | import re | 
					
						
							|  |  |  | import json | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | from .common import InfoExtractor | 
					
						
							| 
									
										
										
										
											2014-12-13 12:24:42 +01:00
										 |  |  | from ..compat import ( | 
					
						
							| 
									
										
										
										
											2013-09-02 11:54:09 +02:00
										 |  |  |     compat_urlparse, | 
					
						
							| 
									
										
										
										
											2014-12-13 12:24:42 +01:00
										 |  |  | ) | 
					
						
							|  |  |  | from ..utils import ( | 
					
						
							| 
									
										
										
										
											2013-09-02 11:54:09 +02:00
										 |  |  |     clean_html, | 
					
						
							| 
									
										
										
										
											2014-12-13 12:24:42 +01:00
										 |  |  |     get_element_by_id, | 
					
						
							| 
									
										
										
										
											2013-09-02 11:54:09 +02:00
										 |  |  | ) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-01-06 12:54:01 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-09-02 11:54:09 +02:00
										 |  |  | class VeeHDIE(InfoExtractor): | 
					
						
							| 
									
										
										
										
											2013-12-04 20:34:47 +07:00
										 |  |  |     _VALID_URL = r'https?://veehd\.com/video/(?P<id>\d+)' | 
					
						
							| 
									
										
										
										
											2013-09-02 11:54:09 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |     _TEST = { | 
					
						
							| 
									
										
										
										
											2014-01-06 12:54:01 +01:00
										 |  |  |         'url': 'http://veehd.com/video/4686958', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							| 
									
										
										
										
											2014-08-28 01:37:57 +02:00
										 |  |  |             'id': '4686958', | 
					
						
							|  |  |  |             'ext': 'mp4', | 
					
						
							| 
									
										
										
										
											2014-01-06 12:54:01 +01:00
										 |  |  |             'title': 'Time Lapse View from Space ( ISS)', | 
					
						
							|  |  |  |             'uploader_id': 'spotted', | 
					
						
							|  |  |  |             'description': 'md5:f0094c4cf3a72e22bc4e4239ef767ad7', | 
					
						
							| 
									
										
										
										
											2013-09-02 11:54:09 +02:00
										 |  |  |         }, | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _real_extract(self, url): | 
					
						
							| 
									
										
										
										
											2014-12-13 12:24:42 +01:00
										 |  |  |         video_id = self._match_id(url) | 
					
						
							| 
									
										
										
										
											2013-09-02 11:54:09 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-01-06 12:54:01 +01:00
										 |  |  |         # VeeHD seems to send garbage on the first request. | 
					
						
							|  |  |  |         # See https://github.com/rg3/youtube-dl/issues/2102 | 
					
						
							|  |  |  |         self._download_webpage(url, video_id, 'Requesting webpage') | 
					
						
							| 
									
										
										
										
											2013-09-02 11:54:09 +02:00
										 |  |  |         webpage = self._download_webpage(url, video_id) | 
					
						
							| 
									
										
										
										
											2014-01-06 12:54:01 +01:00
										 |  |  |         player_path = self._search_regex( | 
					
						
							|  |  |  |             r'\$\("#playeriframe"\).attr\({src : "(.+?)"', | 
					
						
							|  |  |  |             webpage, 'player path') | 
					
						
							| 
									
										
										
										
											2013-09-02 11:54:09 +02:00
										 |  |  |         player_url = compat_urlparse.urljoin(url, player_path) | 
					
						
							| 
									
										
										
										
											2014-01-06 12:54:01 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  |         self._download_webpage(player_url, video_id, 'Requesting player page') | 
					
						
							|  |  |  |         player_page = self._download_webpage( | 
					
						
							|  |  |  |             player_url, video_id, 'Downloading player page') | 
					
						
							|  |  |  |         config_json = self._search_regex( | 
					
						
							|  |  |  |             r'value=\'config=({.+?})\'', player_page, 'config json') | 
					
						
							| 
									
										
										
										
											2013-09-02 11:54:09 +02:00
										 |  |  |         config = json.loads(config_json) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         video_url = compat_urlparse.unquote(config['clip']['url']) | 
					
						
							|  |  |  |         title = clean_html(get_element_by_id('videoName', webpage).rpartition('|')[0]) | 
					
						
							|  |  |  |         uploader_id = self._html_search_regex(r'<a href="/profile/\d+">(.+?)</a>', | 
					
						
							| 
									
										
										
										
											2014-11-23 21:39:15 +01:00
										 |  |  |                                               webpage, 'uploader') | 
					
						
							| 
									
										
										
										
											2013-09-02 11:54:09 +02:00
										 |  |  |         thumbnail = self._search_regex(r'<img id="veehdpreview" src="(.+?)"', | 
					
						
							| 
									
										
										
										
											2014-11-23 21:39:15 +01:00
										 |  |  |                                        webpage, 'thumbnail') | 
					
						
							| 
									
										
										
										
											2013-09-02 11:54:09 +02:00
										 |  |  |         description = self._html_search_regex(r'<td class="infodropdown".*?<div>(.*?)<ul', | 
					
						
							| 
									
										
										
										
											2014-11-23 21:39:15 +01:00
										 |  |  |                                               webpage, 'description', flags=re.DOTALL) | 
					
						
							| 
									
										
										
										
											2013-09-02 11:54:09 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |         return { | 
					
						
							|  |  |  |             '_type': 'video', | 
					
						
							|  |  |  |             'id': video_id, | 
					
						
							|  |  |  |             'title': title, | 
					
						
							|  |  |  |             'url': video_url, | 
					
						
							|  |  |  |             'ext': 'mp4', | 
					
						
							|  |  |  |             'uploader_id': uploader_id, | 
					
						
							|  |  |  |             'thumbnail': thumbnail, | 
					
						
							|  |  |  |             'description': description, | 
					
						
							|  |  |  |         } |