| 
									
										
										
										
											2014-07-28 13:40:58 -05:00
										 |  |  | # encoding: utf-8 | 
					
						
							|  |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-08-22 02:33:29 +02:00
										 |  |  | import json | 
					
						
							| 
									
										
										
										
											2014-07-28 13:40:58 -05:00
										 |  |  | import re | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | from .common import InfoExtractor | 
					
						
							|  |  |  | from ..utils import ( | 
					
						
							| 
									
										
										
										
											2014-08-22 02:33:29 +02:00
										 |  |  |     compat_urlparse, | 
					
						
							|  |  |  |     js_to_json, | 
					
						
							| 
									
										
										
										
											2014-07-28 13:40:58 -05:00
										 |  |  | ) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class PatreonIE(InfoExtractor): | 
					
						
							|  |  |  |     _VALID_URL = r'https?://(?:www\.)?patreon\.com/creation\?hid=(.+)' | 
					
						
							|  |  |  |     _TESTS = [ | 
					
						
							|  |  |  |         { | 
					
						
							|  |  |  |             'url': 'http://www.patreon.com/creation?hid=743933', | 
					
						
							|  |  |  |             'md5': 'e25505eec1053a6e6813b8ed369875cc', | 
					
						
							|  |  |  |             'info_dict': { | 
					
						
							|  |  |  |                 'id': '743933', | 
					
						
							|  |  |  |                 'ext': 'mp3', | 
					
						
							|  |  |  |                 'title': 'Episode 166: David Smalley of Dogma Debate', | 
					
						
							|  |  |  |                 'uploader': 'Cognitive Dissonance Podcast', | 
					
						
							| 
									
										
										
										
											2014-08-22 02:33:29 +02:00
										 |  |  |                 'thumbnail': 're:^https?://.*$', | 
					
						
							| 
									
										
										
										
											2014-07-28 13:40:58 -05:00
										 |  |  |             }, | 
					
						
							|  |  |  |         }, | 
					
						
							| 
									
										
										
										
											2014-08-05 00:26:23 -05:00
										 |  |  |         { | 
					
						
							|  |  |  |             'url': 'http://www.patreon.com/creation?hid=754133', | 
					
						
							|  |  |  |             'md5': '3eb09345bf44bf60451b8b0b81759d0a', | 
					
						
							|  |  |  |             'info_dict': { | 
					
						
							|  |  |  |                 'id': '754133', | 
					
						
							|  |  |  |                 'ext': 'mp3', | 
					
						
							|  |  |  |                 'title': 'CD 167 Extra', | 
					
						
							|  |  |  |                 'uploader': 'Cognitive Dissonance Podcast', | 
					
						
							| 
									
										
										
										
											2014-08-22 02:33:29 +02:00
										 |  |  |                 'thumbnail': 're:^https?://.*$', | 
					
						
							| 
									
										
										
										
											2014-08-05 00:26:23 -05:00
										 |  |  |             }, | 
					
						
							|  |  |  |         }, | 
					
						
							| 
									
										
										
										
											2014-07-28 13:40:58 -05:00
										 |  |  |     ] | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     # Currently Patreon exposes download URL via hidden CSS, so login is not | 
					
						
							|  |  |  |     # needed. Keeping this commented for when this inevitably changes. | 
					
						
							|  |  |  |     '''
 | 
					
						
							|  |  |  |     def _login(self): | 
					
						
							|  |  |  |         (username, password) = self._get_login_info() | 
					
						
							|  |  |  |         if username is None: | 
					
						
							|  |  |  |             return | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         login_form = { | 
					
						
							|  |  |  |             'redirectUrl': 'http://www.patreon.com/', | 
					
						
							|  |  |  |             'email': username, | 
					
						
							|  |  |  |             'password': password, | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         request = compat_urllib_request.Request( | 
					
						
							|  |  |  |             'https://www.patreon.com/processLogin', | 
					
						
							|  |  |  |             compat_urllib_parse.urlencode(login_form).encode('utf-8') | 
					
						
							|  |  |  |         ) | 
					
						
							|  |  |  |         login_page = self._download_webpage(request, None, note='Logging in as %s' % username) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         if re.search(r'onLoginFailed', login_page): | 
					
						
							|  |  |  |             raise ExtractorError('Unable to login, incorrect username and/or password', expected=True) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _real_initialize(self): | 
					
						
							|  |  |  |         self._login() | 
					
						
							|  |  |  |     '''
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _real_extract(self, url): | 
					
						
							|  |  |  |         mobj = re.match(self._VALID_URL, url) | 
					
						
							|  |  |  |         video_id = mobj.group(1) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-08-22 02:33:29 +02:00
										 |  |  |         webpage = self._download_webpage(url, video_id) | 
					
						
							|  |  |  |         title = self._og_search_title(webpage).strip() | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         attach_fn = self._html_search_regex( | 
					
						
							|  |  |  |             r'<div class="attach"><a target="_blank" href="([^"]+)">', | 
					
						
							|  |  |  |             webpage, 'attachment URL', default=None) | 
					
						
							|  |  |  |         if attach_fn is not None: | 
					
						
							|  |  |  |             video_url = 'http://www.patreon.com' + attach_fn | 
					
						
							|  |  |  |             thumbnail = self._og_search_thumbnail(webpage) | 
					
						
							|  |  |  |             uploader = self._html_search_regex( | 
					
						
							|  |  |  |                 r'<strong>(.*?)</strong> is creating', webpage, 'uploader') | 
					
						
							|  |  |  |         else: | 
					
						
							|  |  |  |             playlist_js = self._search_regex( | 
					
						
							|  |  |  |                 r'(?s)new\s+jPlayerPlaylist\(\s*\{\s*[^}]*},\s*(\[.*?,?\s*\])', | 
					
						
							|  |  |  |                 webpage, 'playlist JSON') | 
					
						
							|  |  |  |             playlist_json = js_to_json(playlist_js) | 
					
						
							|  |  |  |             playlist = json.loads(playlist_json) | 
					
						
							|  |  |  |             data = playlist[0] | 
					
						
							|  |  |  |             video_url = self._proto_relative_url(data['mp3']) | 
					
						
							|  |  |  |             thumbnail = self._proto_relative_url(data.get('cover')) | 
					
						
							|  |  |  |             uploader = data.get('artist') | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         return { | 
					
						
							|  |  |  |             'id': video_id, | 
					
						
							|  |  |  |             'url': video_url, | 
					
						
							|  |  |  |             'ext': 'mp3', | 
					
						
							|  |  |  |             'title': title, | 
					
						
							|  |  |  |             'uploader': uploader, | 
					
						
							|  |  |  |             'thumbnail': thumbnail, | 
					
						
							|  |  |  |         } |