| 
									
										
										
										
											2015-03-29 23:41:06 +02:00
										 |  |  | # coding: utf-8 | 
					
						
							|  |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | import base64 | 
					
						
							| 
									
										
										
										
											2015-11-15 02:25:00 +06:00
										 |  |  | import re | 
					
						
							| 
									
										
										
										
											2015-03-29 23:41:06 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | from .common import InfoExtractor | 
					
						
							| 
									
										
										
										
											2015-04-09 19:53:00 +06:00
										 |  |  | from ..compat import compat_urllib_request | 
					
						
							| 
									
										
										
										
											2015-03-30 20:11:51 +06:00
										 |  |  | from ..utils import qualities | 
					
						
							| 
									
										
										
										
											2015-03-29 23:41:06 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class DumpertIE(InfoExtractor): | 
					
						
							| 
									
										
										
										
											2015-11-15 02:25:00 +06:00
										 |  |  |     _VALID_URL = r'(?P<protocol>https?)://(?:www\.)?dumpert\.nl/(?:mediabase|embed)/(?P<id>[0-9]+/[0-9a-zA-Z]+)' | 
					
						
							| 
									
										
										
										
											2015-09-01 18:13:33 +02:00
										 |  |  |     _TESTS = [{ | 
					
						
							| 
									
										
										
										
											2015-03-29 23:41:06 +02:00
										 |  |  |         'url': 'http://www.dumpert.nl/mediabase/6646981/951bc60f/', | 
					
						
							|  |  |  |         'md5': '1b9318d7d5054e7dcb9dc7654f21d643', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '6646981/951bc60f', | 
					
						
							|  |  |  |             'ext': 'mp4', | 
					
						
							|  |  |  |             'title': 'Ik heb nieuws voor je', | 
					
						
							| 
									
										
										
										
											2015-03-30 20:11:51 +06:00
										 |  |  |             'description': 'Niet schrikken hoor', | 
					
						
							|  |  |  |             'thumbnail': 're:^https?://.*\.jpg$', | 
					
						
							| 
									
										
										
										
											2015-03-29 23:41:06 +02:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2015-09-01 18:13:33 +02:00
										 |  |  |     }, { | 
					
						
							|  |  |  |         'url': 'http://www.dumpert.nl/embed/6675421/dc440fe7/', | 
					
						
							|  |  |  |         'only_matching': True, | 
					
						
							|  |  |  |     }] | 
					
						
							| 
									
										
										
										
											2015-03-29 23:41:06 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def _real_extract(self, url): | 
					
						
							| 
									
										
										
										
											2015-11-15 02:25:00 +06:00
										 |  |  |         mobj = re.match(self._VALID_URL, url) | 
					
						
							|  |  |  |         video_id = mobj.group('id') | 
					
						
							|  |  |  |         protocol = mobj.group('protocol') | 
					
						
							| 
									
										
										
										
											2015-04-09 19:53:00 +06:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-11-15 02:25:00 +06:00
										 |  |  |         url = '%s://www.dumpert.nl/mediabase/%s' % (protocol, video_id) | 
					
						
							| 
									
										
										
										
											2015-04-09 19:53:00 +06:00
										 |  |  |         req = compat_urllib_request.Request(url) | 
					
						
							| 
									
										
										
										
											2015-05-11 21:05:39 +06:00
										 |  |  |         req.add_header('Cookie', 'nsfw=1; cpc=10') | 
					
						
							| 
									
										
										
										
											2015-04-09 19:53:00 +06:00
										 |  |  |         webpage = self._download_webpage(req, video_id) | 
					
						
							| 
									
										
										
										
											2015-03-29 23:41:06 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-30 20:11:51 +06:00
										 |  |  |         files_base64 = self._search_regex( | 
					
						
							|  |  |  |             r'data-files="([^"]+)"', webpage, 'data files') | 
					
						
							| 
									
										
										
										
											2015-03-29 23:41:06 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-30 20:11:51 +06:00
										 |  |  |         files = self._parse_json( | 
					
						
							|  |  |  |             base64.b64decode(files_base64.encode('utf-8')).decode('utf-8'), | 
					
						
							|  |  |  |             video_id) | 
					
						
							| 
									
										
										
										
											2015-03-29 23:41:06 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-03-30 20:11:51 +06:00
										 |  |  |         quality = qualities(['flv', 'mobile', 'tablet', '720p']) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         formats = [{ | 
					
						
							|  |  |  |             'url': video_url, | 
					
						
							|  |  |  |             'format_id': format_id, | 
					
						
							|  |  |  |             'quality': quality(format_id), | 
					
						
							|  |  |  |         } for format_id, video_url in files.items() if format_id != 'still'] | 
					
						
							|  |  |  |         self._sort_formats(formats) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         title = self._html_search_meta( | 
					
						
							|  |  |  |             'title', webpage) or self._og_search_title(webpage) | 
					
						
							|  |  |  |         description = self._html_search_meta( | 
					
						
							|  |  |  |             'description', webpage) or self._og_search_description(webpage) | 
					
						
							|  |  |  |         thumbnail = files.get('still') or self._og_search_thumbnail(webpage) | 
					
						
							| 
									
										
										
										
											2015-03-29 23:41:06 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |         return { | 
					
						
							|  |  |  |             'id': video_id, | 
					
						
							|  |  |  |             'title': title, | 
					
						
							|  |  |  |             'description': description, | 
					
						
							| 
									
										
										
										
											2015-03-30 20:11:51 +06:00
										 |  |  |             'thumbnail': thumbnail, | 
					
						
							| 
									
										
										
										
											2015-03-29 23:41:06 +02:00
										 |  |  |             'formats': formats | 
					
						
							|  |  |  |         } |