| 
									
										
										
										
											2014-12-12 17:39:33 +01:00
										 |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | from .common import InfoExtractor | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class GrouponIE(InfoExtractor): | 
					
						
							| 
									
										
										
										
											2016-05-16 00:30:13 +06:00
										 |  |  |     _VALID_URL = r'https?://(?:www\.)?groupon\.com/deals/(?P<id>[^/?#&]+)' | 
					
						
							| 
									
										
										
										
											2014-12-12 17:39:33 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  |     _TEST = { | 
					
						
							|  |  |  |         'url': 'https://www.groupon.com/deals/bikram-yoga-huntington-beach-2#ooid=tubGNycTo_9Uxg82uESj4i61EYX8nyuf', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': 'bikram-yoga-huntington-beach-2', | 
					
						
							|  |  |  |             'title': '$49 for 10 Yoga Classes or One Month of Unlimited Classes at Bikram Yoga Huntington Beach ($180 Value)', | 
					
						
							|  |  |  |             'description': 'Studio kept at 105 degrees and 40% humidity with anti-microbial and anti-slip Flotex flooring; certified instructors', | 
					
						
							|  |  |  |         }, | 
					
						
							|  |  |  |         'playlist': [{ | 
					
						
							| 
									
										
										
										
											2016-05-24 11:24:29 +01:00
										 |  |  |             'md5': '42428ce8a00585f9bc36e49226eae7a1', | 
					
						
							| 
									
										
										
										
											2014-12-12 17:39:33 +01:00
										 |  |  |             'info_dict': { | 
					
						
							| 
									
										
										
										
											2016-05-16 00:30:13 +06:00
										 |  |  |                 'id': 'fk6OhWpXgIQ', | 
					
						
							|  |  |  |                 'ext': 'mp4', | 
					
						
							|  |  |  |                 'title': 'Bikram Yoga Huntington Beach | Orange County !tubGNycTo@9Uxg82uESj4i61EYX8nyuf', | 
					
						
							| 
									
										
										
										
											2015-10-16 16:02:40 +01:00
										 |  |  |                 'description': 'md5:d41d8cd98f00b204e9800998ecf8427e', | 
					
						
							| 
									
										
										
										
											2016-05-16 00:30:13 +06:00
										 |  |  |                 'duration': 45, | 
					
						
							|  |  |  |                 'upload_date': '20160405', | 
					
						
							|  |  |  |                 'uploader_id': 'groupon', | 
					
						
							|  |  |  |                 'uploader': 'Groupon', | 
					
						
							| 
									
										
										
										
											2014-12-12 17:39:33 +01:00
										 |  |  |             }, | 
					
						
							| 
									
										
										
										
											2016-05-24 11:24:29 +01:00
										 |  |  |             'add_ie': ['Youtube'], | 
					
						
							| 
									
										
										
										
											2016-05-24 16:42:22 +01:00
										 |  |  |         }], | 
					
						
							|  |  |  |         'params': { | 
					
						
							|  |  |  |             'skip_download': True, | 
					
						
							|  |  |  |         }, | 
					
						
							| 
									
										
										
										
											2014-12-12 17:39:33 +01:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-05-16 00:30:13 +06:00
										 |  |  |     _PROVIDERS = { | 
					
						
							|  |  |  |         'ooyala': ('ooyala:%s', 'Ooyala'), | 
					
						
							|  |  |  |         'youtube': ('%s', 'Youtube'), | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-12-12 17:39:33 +01:00
										 |  |  |     def _real_extract(self, url): | 
					
						
							|  |  |  |         playlist_id = self._match_id(url) | 
					
						
							|  |  |  |         webpage = self._download_webpage(url, playlist_id) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         payload = self._parse_json(self._search_regex( | 
					
						
							| 
									
										
										
										
											2016-04-12 17:26:09 +08:00
										 |  |  |             r'(?:var\s+|window\.)payload\s*=\s*(.*?);\n', webpage, 'payload'), playlist_id) | 
					
						
							| 
									
										
										
										
											2014-12-12 17:39:33 +01:00
										 |  |  |         videos = payload['carousel'].get('dealVideos', []) | 
					
						
							|  |  |  |         entries = [] | 
					
						
							|  |  |  |         for v in videos: | 
					
						
							| 
									
										
										
										
											2016-05-16 00:30:13 +06:00
										 |  |  |             provider = v.get('provider') | 
					
						
							|  |  |  |             video_id = v.get('media') or v.get('id') or v.get('baseURL') | 
					
						
							|  |  |  |             if not provider or not video_id: | 
					
						
							|  |  |  |                 continue | 
					
						
							|  |  |  |             url_pattern, ie_key = self._PROVIDERS.get(provider.lower()) | 
					
						
							|  |  |  |             if not url_pattern: | 
					
						
							| 
									
										
										
										
											2014-12-12 17:39:33 +01:00
										 |  |  |                 self.report_warning( | 
					
						
							|  |  |  |                     '%s: Unsupported video provider %s, skipping video' % | 
					
						
							| 
									
										
										
										
											2016-05-16 00:30:13 +06:00
										 |  |  |                     (playlist_id, provider)) | 
					
						
							| 
									
										
										
										
											2014-12-12 17:39:33 +01:00
										 |  |  |                 continue | 
					
						
							| 
									
										
										
										
											2016-05-16 00:30:13 +06:00
										 |  |  |             entries.append(self.url_result(url_pattern % video_id, ie_key)) | 
					
						
							| 
									
										
										
										
											2014-12-12 17:39:33 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  |         return { | 
					
						
							|  |  |  |             '_type': 'playlist', | 
					
						
							|  |  |  |             'id': playlist_id, | 
					
						
							|  |  |  |             'entries': entries, | 
					
						
							|  |  |  |             'title': self._og_search_title(webpage), | 
					
						
							|  |  |  |             'description': self._og_search_description(webpage), | 
					
						
							|  |  |  |         } |