| 
									
										
										
										
											2016-10-02 13:39:18 +02:00
										 |  |  | # coding: utf-8 | 
					
						
							| 
									
										
										
										
											2014-07-28 13:40:58 -05:00
										 |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | from .common import InfoExtractor | 
					
						
							| 
									
										
										
										
											2018-10-05 20:11:01 +01:00
										 |  |  | from ..utils import ( | 
					
						
							|  |  |  |     clean_html, | 
					
						
							|  |  |  |     determine_ext, | 
					
						
							|  |  |  |     int_or_none, | 
					
						
							|  |  |  |     parse_iso8601, | 
					
						
							|  |  |  | ) | 
					
						
							| 
									
										
										
										
											2014-07-28 13:40:58 -05:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class PatreonIE(InfoExtractor): | 
					
						
							| 
									
										
										
										
											2018-10-05 20:11:01 +01:00
										 |  |  |     _VALID_URL = r'https?://(?:www\.)?patreon\.com/(?:creation\?hid=|posts/(?:[\w-]+-)?)(?P<id>\d+)' | 
					
						
							|  |  |  |     _TESTS = [{ | 
					
						
							|  |  |  |         'url': 'http://www.patreon.com/creation?hid=743933', | 
					
						
							|  |  |  |         'md5': 'e25505eec1053a6e6813b8ed369875cc', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '743933', | 
					
						
							|  |  |  |             'ext': 'mp3', | 
					
						
							|  |  |  |             'title': 'Episode 166: David Smalley of Dogma Debate', | 
					
						
							|  |  |  |             'description': 'md5:713b08b772cd6271b9f3906683cfacdf', | 
					
						
							|  |  |  |             'uploader': 'Cognitive Dissonance Podcast', | 
					
						
							|  |  |  |             'thumbnail': 're:^https?://.*$', | 
					
						
							|  |  |  |             'timestamp': 1406473987, | 
					
						
							|  |  |  |             'upload_date': '20140727', | 
					
						
							|  |  |  |         }, | 
					
						
							|  |  |  |     }, { | 
					
						
							|  |  |  |         'url': 'http://www.patreon.com/creation?hid=754133', | 
					
						
							|  |  |  |         'md5': '3eb09345bf44bf60451b8b0b81759d0a', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '754133', | 
					
						
							|  |  |  |             'ext': 'mp3', | 
					
						
							|  |  |  |             'title': 'CD 167 Extra', | 
					
						
							|  |  |  |             'uploader': 'Cognitive Dissonance Podcast', | 
					
						
							|  |  |  |             'thumbnail': 're:^https?://.*$', | 
					
						
							| 
									
										
										
										
											2014-07-28 13:40:58 -05:00
										 |  |  |         }, | 
					
						
							| 
									
										
										
										
											2018-10-05 20:11:01 +01:00
										 |  |  |         'skip': 'Patron-only content', | 
					
						
							|  |  |  |     }, { | 
					
						
							|  |  |  |         'url': 'https://www.patreon.com/creation?hid=1682498', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': 'SU4fj_aEMVw', | 
					
						
							|  |  |  |             'ext': 'mp4', | 
					
						
							|  |  |  |             'title': 'I\'m on Patreon!', | 
					
						
							|  |  |  |             'uploader': 'TraciJHines', | 
					
						
							|  |  |  |             'thumbnail': 're:^https?://.*$', | 
					
						
							|  |  |  |             'upload_date': '20150211', | 
					
						
							|  |  |  |             'description': 'md5:c5a706b1f687817a3de09db1eb93acd4', | 
					
						
							|  |  |  |             'uploader_id': 'TraciJHines', | 
					
						
							| 
									
										
										
										
											2014-08-05 00:26:23 -05:00
										 |  |  |         }, | 
					
						
							| 
									
										
										
										
											2018-10-05 20:11:01 +01:00
										 |  |  |         'params': { | 
					
						
							|  |  |  |             'noplaylist': True, | 
					
						
							|  |  |  |             'skip_download': True, | 
					
						
							| 
									
										
										
										
											2015-02-19 01:04:19 +01:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2018-10-05 20:11:01 +01:00
										 |  |  |     }, { | 
					
						
							|  |  |  |         'url': 'https://www.patreon.com/posts/episode-166-of-743933', | 
					
						
							|  |  |  |         'only_matching': True, | 
					
						
							|  |  |  |     }, { | 
					
						
							|  |  |  |         'url': 'https://www.patreon.com/posts/743933', | 
					
						
							|  |  |  |         'only_matching': True, | 
					
						
							|  |  |  |     }] | 
					
						
							| 
									
										
										
										
											2014-07-28 13:40:58 -05:00
										 |  |  | 
 | 
					
						
							|  |  |  |     # Currently Patreon exposes download URL via hidden CSS, so login is not | 
					
						
							|  |  |  |     # needed. Keeping this commented for when this inevitably changes. | 
					
						
							|  |  |  |     '''
 | 
					
						
							|  |  |  |     def _login(self): | 
					
						
							| 
									
										
										
										
											2018-05-26 16:12:44 +01:00
										 |  |  |         username, password = self._get_login_info() | 
					
						
							| 
									
										
										
										
											2014-07-28 13:40:58 -05:00
										 |  |  |         if username is None: | 
					
						
							|  |  |  |             return | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         login_form = { | 
					
						
							|  |  |  |             'redirectUrl': 'http://www.patreon.com/', | 
					
						
							|  |  |  |             'email': username, | 
					
						
							|  |  |  |             'password': password, | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-11-21 22:18:17 +06:00
										 |  |  |         request = sanitized_Request( | 
					
						
							| 
									
										
										
										
											2014-07-28 13:40:58 -05:00
										 |  |  |             'https://www.patreon.com/processLogin', | 
					
						
							| 
									
										
										
										
											2016-03-26 01:46:57 +06:00
										 |  |  |             compat_urllib_parse_urlencode(login_form).encode('utf-8') | 
					
						
							| 
									
										
										
										
											2014-07-28 13:40:58 -05:00
										 |  |  |         ) | 
					
						
							| 
									
										
										
										
											2017-11-11 20:49:03 +07:00
										 |  |  |         login_page = self._download_webpage(request, None, note='Logging in') | 
					
						
							| 
									
										
										
										
											2014-07-28 13:40:58 -05:00
										 |  |  | 
 | 
					
						
							|  |  |  |         if re.search(r'onLoginFailed', login_page): | 
					
						
							|  |  |  |             raise ExtractorError('Unable to login, incorrect username and/or password', expected=True) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _real_initialize(self): | 
					
						
							|  |  |  |         self._login() | 
					
						
							|  |  |  |     '''
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _real_extract(self, url): | 
					
						
							| 
									
										
										
										
											2015-02-19 00:38:05 +01:00
										 |  |  |         video_id = self._match_id(url) | 
					
						
							| 
									
										
										
										
											2018-10-05 20:11:01 +01:00
										 |  |  |         post = self._download_json( | 
					
						
							|  |  |  |             'https://www.patreon.com/api/posts/' + video_id, video_id) | 
					
						
							|  |  |  |         attributes = post['data']['attributes'] | 
					
						
							|  |  |  |         title = attributes['title'].strip() | 
					
						
							|  |  |  |         image = attributes.get('image') or {} | 
					
						
							|  |  |  |         info = { | 
					
						
							| 
									
										
										
										
											2014-08-22 02:33:29 +02:00
										 |  |  |             'id': video_id, | 
					
						
							|  |  |  |             'title': title, | 
					
						
							| 
									
										
										
										
											2018-10-05 20:11:01 +01:00
										 |  |  |             'description': clean_html(attributes.get('content')), | 
					
						
							|  |  |  |             'thumbnail': image.get('large_url') or image.get('url'), | 
					
						
							|  |  |  |             'timestamp': parse_iso8601(attributes.get('published_at')), | 
					
						
							|  |  |  |             'like_count': int_or_none(attributes.get('like_count')), | 
					
						
							|  |  |  |             'comment_count': int_or_none(attributes.get('comment_count')), | 
					
						
							| 
									
										
										
										
											2014-08-22 02:33:29 +02:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2018-10-05 20:11:01 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-10-05 22:45:04 +01:00
										 |  |  |         def add_file(file_data): | 
					
						
							|  |  |  |             file_url = file_data.get('url') | 
					
						
							|  |  |  |             if file_url: | 
					
						
							|  |  |  |                 info.update({ | 
					
						
							|  |  |  |                     'url': file_url, | 
					
						
							|  |  |  |                     'ext': determine_ext(file_data.get('name'), 'mp3'), | 
					
						
							|  |  |  |                 }) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-10-05 20:11:01 +01:00
										 |  |  |         for i in post.get('included', []): | 
					
						
							|  |  |  |             i_type = i.get('type') | 
					
						
							|  |  |  |             if i_type == 'attachment': | 
					
						
							| 
									
										
										
										
											2018-10-05 22:45:04 +01:00
										 |  |  |                 add_file(i.get('attributes') or {}) | 
					
						
							| 
									
										
										
										
											2018-10-05 20:11:01 +01:00
										 |  |  |             elif i_type == 'user': | 
					
						
							|  |  |  |                 user_attributes = i.get('attributes') | 
					
						
							|  |  |  |                 if user_attributes: | 
					
						
							|  |  |  |                     info.update({ | 
					
						
							|  |  |  |                         'uploader': user_attributes.get('full_name'), | 
					
						
							|  |  |  |                         'uploader_url': user_attributes.get('url'), | 
					
						
							|  |  |  |                     }) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-10-05 22:45:04 +01:00
										 |  |  |         if not info.get('url'): | 
					
						
							|  |  |  |             add_file(attributes.get('post_file') or {}) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-10-05 20:11:01 +01:00
										 |  |  |         if not info.get('url'): | 
					
						
							|  |  |  |             info.update({ | 
					
						
							|  |  |  |                 '_type': 'url', | 
					
						
							|  |  |  |                 'url': attributes['embed']['url'], | 
					
						
							|  |  |  |             }) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         return info |