| 
									
										
										
										
											2016-10-02 13:39:18 +02:00
										 |  |  | # coding: utf-8 | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | import re | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | from .common import InfoExtractor | 
					
						
							| 
									
										
										
										
											2014-06-07 20:32:23 +07:00
										 |  |  | from ..utils import ( | 
					
						
							|  |  |  |     qualities, | 
					
						
							|  |  |  |     determine_ext, | 
					
						
							|  |  |  | ) | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class TeacherTubeIE(InfoExtractor): | 
					
						
							|  |  |  |     IE_NAME = 'teachertube' | 
					
						
							|  |  |  |     IE_DESC = 'teachertube.com videos' | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-07-03 21:11:56 +07:00
										 |  |  |     _VALID_URL = r'https?://(?:www\.)?teachertube\.com/(viewVideo\.php\?video_id=|music\.php\?music_id=|video/(?:[\da-z-]+-)?|audio/)(?P<id>\d+)' | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |     _TESTS = [{ | 
					
						
							|  |  |  |         'url': 'http://www.teachertube.com/viewVideo.php?video_id=339997', | 
					
						
							|  |  |  |         'md5': 'f9434ef992fd65936d72999951ee254c', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '339997', | 
					
						
							|  |  |  |             'ext': 'mp4', | 
					
						
							| 
									
										
										
										
											2014-06-23 03:07:10 +07:00
										 |  |  |             'title': 'Measures of dispersion from a frequency table', | 
					
						
							|  |  |  |             'description': 'Measures of dispersion from a frequency table', | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  |             'thumbnail': 're:http://.*\.jpg', | 
					
						
							|  |  |  |         }, | 
					
						
							|  |  |  |     }, { | 
					
						
							|  |  |  |         'url': 'http://www.teachertube.com/viewVideo.php?video_id=340064', | 
					
						
							|  |  |  |         'md5': '0d625ec6bc9bf50f70170942ad580676', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '340064', | 
					
						
							|  |  |  |             'ext': 'mp4', | 
					
						
							|  |  |  |             'title': 'How to Make Paper Dolls _ Paper Art Projects', | 
					
						
							| 
									
										
										
										
											2014-06-23 03:07:10 +07:00
										 |  |  |             'description': 'Learn how to make paper dolls in this simple', | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  |             'thumbnail': 're:http://.*\.jpg', | 
					
						
							|  |  |  |         }, | 
					
						
							| 
									
										
										
										
											2014-06-07 20:32:23 +07:00
										 |  |  |     }, { | 
					
						
							|  |  |  |         'url': 'http://www.teachertube.com/music.php?music_id=8805', | 
					
						
							|  |  |  |         'md5': '01e8352006c65757caf7b961f6050e21', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '8805', | 
					
						
							|  |  |  |             'ext': 'mp3', | 
					
						
							|  |  |  |             'title': 'PER ASPERA AD ASTRA', | 
					
						
							| 
									
										
										
										
											2014-06-23 03:07:10 +07:00
										 |  |  |             'description': 'RADIJSKA EMISIJA ZRAKOPLOVNE TEHNI?KE ?KOLE P', | 
					
						
							| 
									
										
										
										
											2014-06-07 20:32:23 +07:00
										 |  |  |         }, | 
					
						
							| 
									
										
										
										
											2014-07-03 21:11:56 +07:00
										 |  |  |     }, { | 
					
						
							|  |  |  |         'url': 'http://www.teachertube.com/video/intro-video-schleicher-297790', | 
					
						
							|  |  |  |         'md5': '9c79fbb2dd7154823996fc28d4a26998', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '297790', | 
					
						
							|  |  |  |             'ext': 'mp4', | 
					
						
							|  |  |  |             'title': 'Intro Video - Schleicher', | 
					
						
							|  |  |  |             'description': 'Intro Video - Why to flip, how flipping will', | 
					
						
							|  |  |  |         }, | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  |     }] | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _real_extract(self, url): | 
					
						
							| 
									
										
										
										
											2015-01-07 11:43:20 +01:00
										 |  |  |         video_id = self._match_id(url) | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  |         webpage = self._download_webpage(url, video_id) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-07-21 12:47:01 +02:00
										 |  |  |         title = self._html_search_meta('title', webpage, 'title', fatal=True) | 
					
						
							| 
									
										
										
										
											2014-06-23 03:07:10 +07:00
										 |  |  |         TITLE_SUFFIX = ' - TeacherTube' | 
					
						
							|  |  |  |         if title.endswith(TITLE_SUFFIX): | 
					
						
							|  |  |  |             title = title[:-len(TITLE_SUFFIX)].strip() | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         description = self._html_search_meta('description', webpage, 'description') | 
					
						
							|  |  |  |         if description: | 
					
						
							|  |  |  |             description = description.strip() | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-07 20:32:23 +07:00
										 |  |  |         quality = qualities(['mp3', 'flv', 'mp4']) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-23 03:07:10 +07:00
										 |  |  |         media_urls = re.findall(r'data-contenturl="([^"]+)"', webpage) | 
					
						
							|  |  |  |         media_urls.extend(re.findall(r'var\s+filePath\s*=\s*"([^"]+)"', webpage)) | 
					
						
							| 
									
										
										
										
											2014-06-26 20:00:47 +07:00
										 |  |  |         media_urls.extend(re.findall(r'\'file\'\s*:\s*["\']([^"\']+)["\'],', webpage)) | 
					
						
							| 
									
										
										
										
											2014-06-08 22:16:48 +07:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-07 20:32:23 +07:00
										 |  |  |         formats = [ | 
					
						
							|  |  |  |             { | 
					
						
							|  |  |  |                 'url': media_url, | 
					
						
							|  |  |  |                 'quality': quality(determine_ext(media_url)) | 
					
						
							| 
									
										
										
										
											2014-06-08 22:16:48 +07:00
										 |  |  |             } for media_url in set(media_urls) | 
					
						
							| 
									
										
										
										
											2014-06-07 20:32:23 +07:00
										 |  |  |         ] | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |         self._sort_formats(formats) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         return { | 
					
						
							|  |  |  |             'id': video_id, | 
					
						
							| 
									
										
										
										
											2014-06-23 03:07:10 +07:00
										 |  |  |             'title': title, | 
					
						
							| 
									
										
										
										
											2014-06-26 20:00:47 +07:00
										 |  |  |             'thumbnail': self._html_search_regex(r'\'image\'\s*:\s*["\']([^"\']+)["\']', webpage, 'thumbnail'), | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  |             'formats': formats, | 
					
						
							| 
									
										
										
										
											2014-06-23 03:07:10 +07:00
										 |  |  |             'description': description, | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-29 13:45:10 +02:00
										 |  |  | class TeacherTubeUserIE(InfoExtractor): | 
					
						
							|  |  |  |     IE_NAME = 'teachertube:user:collection' | 
					
						
							|  |  |  |     IE_DESC = 'teachertube.com user and collection videos' | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-29 13:45:10 +02:00
										 |  |  |     _VALID_URL = r'https?://(?:www\.)?teachertube\.com/(user/profile|collection)/(?P<user>[0-9a-zA-Z]+)/?' | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-07-21 12:47:01 +02:00
										 |  |  |     _MEDIA_RE = r'''(?sx)
 | 
					
						
							|  |  |  |         class="?sidebar_thumb_time"?>[0-9:]+</div> | 
					
						
							|  |  |  |         \s* | 
					
						
							|  |  |  |         <a\s+href="(https?://(?:www\.)?teachertube\.com/(?:video|audio)/[^"]+)" | 
					
						
							|  |  |  |     '''
 | 
					
						
							| 
									
										
										
										
											2014-08-28 00:58:24 +02:00
										 |  |  |     _TEST = { | 
					
						
							|  |  |  |         'url': 'http://www.teachertube.com/user/profile/rbhagwati2', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': 'rbhagwati2' | 
					
						
							|  |  |  |         }, | 
					
						
							|  |  |  |         'playlist_mincount': 179, | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2014-07-03 21:08:44 +07:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  |     def _real_extract(self, url): | 
					
						
							|  |  |  |         mobj = re.match(self._VALID_URL, url) | 
					
						
							|  |  |  |         user_id = mobj.group('user') | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-29 13:45:10 +02:00
										 |  |  |         urls = [] | 
					
						
							|  |  |  |         webpage = self._download_webpage(url, user_id) | 
					
						
							| 
									
										
										
										
											2014-07-03 21:08:44 +07:00
										 |  |  |         urls.extend(re.findall(self._MEDIA_RE, webpage)) | 
					
						
							| 
									
										
										
										
											2014-11-23 20:41:03 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-07-21 12:47:01 +02:00
										 |  |  |         pages = re.findall(r'/ajax-user/user-videos/%s\?page=([0-9]+)' % user_id, webpage)[:-1] | 
					
						
							| 
									
										
										
										
											2014-06-29 13:45:10 +02:00
										 |  |  |         for p in pages: | 
					
						
							|  |  |  |             more = 'http://www.teachertube.com/ajax-user/user-videos/%s?page=%s' % (user_id, p) | 
					
						
							| 
									
										
										
										
											2014-07-21 12:47:01 +02:00
										 |  |  |             webpage = self._download_webpage(more, user_id, 'Downloading page %s/%s' % (p, len(pages))) | 
					
						
							|  |  |  |             video_urls = re.findall(self._MEDIA_RE, webpage) | 
					
						
							|  |  |  |             urls.extend(video_urls) | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-07-21 12:47:01 +02:00
										 |  |  |         entries = [self.url_result(vurl, 'TeacherTube') for vurl in urls] | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  |         return self.playlist_result(entries, user_id) |