| 
									
										
										
										
											2016-10-02 13:39:18 +02:00
										 |  |  | # coding: utf-8 | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | import re | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | from .common import InfoExtractor | 
					
						
							| 
									
										
										
										
											2014-06-07 20:32:23 +07:00
										 |  |  | from ..utils import ( | 
					
						
							|  |  |  |     determine_ext, | 
					
						
							| 
									
										
										
										
											2018-01-24 22:46:04 +07:00
										 |  |  |     ExtractorError, | 
					
						
							|  |  |  |     qualities, | 
					
						
							| 
									
										
										
										
											2014-06-07 20:32:23 +07:00
										 |  |  | ) | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class TeacherTubeIE(InfoExtractor): | 
					
						
							|  |  |  |     IE_NAME = 'teachertube' | 
					
						
							|  |  |  |     IE_DESC = 'teachertube.com videos' | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-07-03 21:11:56 +07:00
										 |  |  |     _VALID_URL = r'https?://(?:www\.)?teachertube\.com/(viewVideo\.php\?video_id=|music\.php\?music_id=|video/(?:[\da-z-]+-)?|audio/)(?P<id>\d+)' | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |     _TESTS = [{ | 
					
						
							| 
									
										
										
										
											2018-01-24 22:41:25 +07:00
										 |  |  |         # flowplayer | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  |         'url': 'http://www.teachertube.com/viewVideo.php?video_id=339997', | 
					
						
							|  |  |  |         'md5': 'f9434ef992fd65936d72999951ee254c', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '339997', | 
					
						
							|  |  |  |             'ext': 'mp4', | 
					
						
							| 
									
										
										
										
											2014-06-23 03:07:10 +07:00
										 |  |  |             'title': 'Measures of dispersion from a frequency table', | 
					
						
							|  |  |  |             'description': 'Measures of dispersion from a frequency table', | 
					
						
							| 
									
										
										
										
											2018-01-24 22:41:25 +07:00
										 |  |  |             'thumbnail': r're:https?://.*\.(?:jpg|png)', | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  |         }, | 
					
						
							| 
									
										
										
										
											2014-06-07 20:32:23 +07:00
										 |  |  |     }, { | 
					
						
							| 
									
										
										
										
											2018-01-24 22:41:25 +07:00
										 |  |  |         # jwplayer | 
					
						
							| 
									
										
										
										
											2014-06-07 20:32:23 +07:00
										 |  |  |         'url': 'http://www.teachertube.com/music.php?music_id=8805', | 
					
						
							|  |  |  |         'md5': '01e8352006c65757caf7b961f6050e21', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '8805', | 
					
						
							|  |  |  |             'ext': 'mp3', | 
					
						
							|  |  |  |             'title': 'PER ASPERA AD ASTRA', | 
					
						
							| 
									
										
										
										
											2014-06-23 03:07:10 +07:00
										 |  |  |             'description': 'RADIJSKA EMISIJA ZRAKOPLOVNE TEHNI?KE ?KOLE P', | 
					
						
							| 
									
										
										
										
											2014-06-07 20:32:23 +07:00
										 |  |  |         }, | 
					
						
							| 
									
										
										
										
											2014-07-03 21:11:56 +07:00
										 |  |  |     }, { | 
					
						
							| 
									
										
										
										
											2018-01-24 22:41:25 +07:00
										 |  |  |         # unavailable video | 
					
						
							| 
									
										
										
										
											2014-07-03 21:11:56 +07:00
										 |  |  |         'url': 'http://www.teachertube.com/video/intro-video-schleicher-297790', | 
					
						
							| 
									
										
										
										
											2018-01-24 22:41:25 +07:00
										 |  |  |         'only_matching': True, | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  |     }] | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _real_extract(self, url): | 
					
						
							| 
									
										
										
										
											2015-01-07 11:43:20 +01:00
										 |  |  |         video_id = self._match_id(url) | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  |         webpage = self._download_webpage(url, video_id) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-01-24 22:46:04 +07:00
										 |  |  |         error = self._search_regex( | 
					
						
							|  |  |  |             r'<div\b[^>]+\bclass=["\']msgBox error[^>]+>([^<]+)', webpage, | 
					
						
							|  |  |  |             'error', default=None) | 
					
						
							|  |  |  |         if error: | 
					
						
							|  |  |  |             raise ExtractorError('%s said: %s' % (self.IE_NAME, error), expected=True) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-07-21 12:47:01 +02:00
										 |  |  |         title = self._html_search_meta('title', webpage, 'title', fatal=True) | 
					
						
							| 
									
										
										
										
											2014-06-23 03:07:10 +07:00
										 |  |  |         TITLE_SUFFIX = ' - TeacherTube' | 
					
						
							|  |  |  |         if title.endswith(TITLE_SUFFIX): | 
					
						
							|  |  |  |             title = title[:-len(TITLE_SUFFIX)].strip() | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         description = self._html_search_meta('description', webpage, 'description') | 
					
						
							|  |  |  |         if description: | 
					
						
							|  |  |  |             description = description.strip() | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-07 20:32:23 +07:00
										 |  |  |         quality = qualities(['mp3', 'flv', 'mp4']) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-23 03:07:10 +07:00
										 |  |  |         media_urls = re.findall(r'data-contenturl="([^"]+)"', webpage) | 
					
						
							|  |  |  |         media_urls.extend(re.findall(r'var\s+filePath\s*=\s*"([^"]+)"', webpage)) | 
					
						
							| 
									
										
										
										
											2014-06-26 20:00:47 +07:00
										 |  |  |         media_urls.extend(re.findall(r'\'file\'\s*:\s*["\']([^"\']+)["\'],', webpage)) | 
					
						
							| 
									
										
										
										
											2014-06-08 22:16:48 +07:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-07 20:32:23 +07:00
										 |  |  |         formats = [ | 
					
						
							|  |  |  |             { | 
					
						
							|  |  |  |                 'url': media_url, | 
					
						
							|  |  |  |                 'quality': quality(determine_ext(media_url)) | 
					
						
							| 
									
										
										
										
											2014-06-08 22:16:48 +07:00
										 |  |  |             } for media_url in set(media_urls) | 
					
						
							| 
									
										
										
										
											2014-06-07 20:32:23 +07:00
										 |  |  |         ] | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |         self._sort_formats(formats) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-01-24 22:41:25 +07:00
										 |  |  |         thumbnail = self._og_search_thumbnail( | 
					
						
							|  |  |  |             webpage, default=None) or self._html_search_meta( | 
					
						
							|  |  |  |             'thumbnail', webpage) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  |         return { | 
					
						
							|  |  |  |             'id': video_id, | 
					
						
							| 
									
										
										
										
											2014-06-23 03:07:10 +07:00
										 |  |  |             'title': title, | 
					
						
							|  |  |  |             'description': description, | 
					
						
							| 
									
										
										
										
											2018-01-24 22:41:25 +07:00
										 |  |  |             'thumbnail': thumbnail, | 
					
						
							|  |  |  |             'formats': formats, | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-29 13:45:10 +02:00
										 |  |  | class TeacherTubeUserIE(InfoExtractor): | 
					
						
							|  |  |  |     IE_NAME = 'teachertube:user:collection' | 
					
						
							|  |  |  |     IE_DESC = 'teachertube.com user and collection videos' | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-29 13:45:10 +02:00
										 |  |  |     _VALID_URL = r'https?://(?:www\.)?teachertube\.com/(user/profile|collection)/(?P<user>[0-9a-zA-Z]+)/?' | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-07-21 12:47:01 +02:00
										 |  |  |     _MEDIA_RE = r'''(?sx)
 | 
					
						
							|  |  |  |         class="?sidebar_thumb_time"?>[0-9:]+</div> | 
					
						
							|  |  |  |         \s* | 
					
						
							|  |  |  |         <a\s+href="(https?://(?:www\.)?teachertube\.com/(?:video|audio)/[^"]+)" | 
					
						
							|  |  |  |     '''
 | 
					
						
							| 
									
										
										
										
											2014-08-28 00:58:24 +02:00
										 |  |  |     _TEST = { | 
					
						
							|  |  |  |         'url': 'http://www.teachertube.com/user/profile/rbhagwati2', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': 'rbhagwati2' | 
					
						
							|  |  |  |         }, | 
					
						
							|  |  |  |         'playlist_mincount': 179, | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2014-07-03 21:08:44 +07:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  |     def _real_extract(self, url): | 
					
						
							|  |  |  |         mobj = re.match(self._VALID_URL, url) | 
					
						
							|  |  |  |         user_id = mobj.group('user') | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-06-29 13:45:10 +02:00
										 |  |  |         urls = [] | 
					
						
							|  |  |  |         webpage = self._download_webpage(url, user_id) | 
					
						
							| 
									
										
										
										
											2014-07-03 21:08:44 +07:00
										 |  |  |         urls.extend(re.findall(self._MEDIA_RE, webpage)) | 
					
						
							| 
									
										
										
										
											2014-11-23 20:41:03 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-07-21 12:47:01 +02:00
										 |  |  |         pages = re.findall(r'/ajax-user/user-videos/%s\?page=([0-9]+)' % user_id, webpage)[:-1] | 
					
						
							| 
									
										
										
										
											2014-06-29 13:45:10 +02:00
										 |  |  |         for p in pages: | 
					
						
							|  |  |  |             more = 'http://www.teachertube.com/ajax-user/user-videos/%s?page=%s' % (user_id, p) | 
					
						
							| 
									
										
										
										
											2014-07-21 12:47:01 +02:00
										 |  |  |             webpage = self._download_webpage(more, user_id, 'Downloading page %s/%s' % (p, len(pages))) | 
					
						
							|  |  |  |             video_urls = re.findall(self._MEDIA_RE, webpage) | 
					
						
							|  |  |  |             urls.extend(video_urls) | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-07-21 12:47:01 +02:00
										 |  |  |         entries = [self.url_result(vurl, 'TeacherTube') for vurl in urls] | 
					
						
							| 
									
										
										
										
											2014-06-06 11:21:59 +02:00
										 |  |  |         return self.playlist_result(entries, user_id) |