| 
									
										
										
										
											2017-04-07 21:52:48 +02:00
										 |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-04-08 20:08:31 +07:00
										 |  |  | import re | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-04-07 21:52:48 +02:00
										 |  |  | from .common import InfoExtractor | 
					
						
							|  |  |  | from .ooyala import OoyalaIE | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class TheSunIE(InfoExtractor): | 
					
						
							| 
									
										
										
										
											2017-04-08 20:08:31 +07:00
										 |  |  |     _VALID_URL = r'https://(?:www\.)?thesun\.co\.uk/[^/]+/(?P<id>\d+)' | 
					
						
							| 
									
										
										
										
											2017-04-07 21:52:48 +02:00
										 |  |  |     _TEST = { | 
					
						
							|  |  |  |         'url': 'https://www.thesun.co.uk/tvandshowbiz/2261604/orlando-bloom-and-katy-perry-post-adorable-instagram-video-together-celebrating-thanksgiving-after-split-rumours/', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							| 
									
										
										
										
											2017-04-08 20:08:31 +07:00
										 |  |  |             'id': '2261604', | 
					
						
							|  |  |  |             'title': 'md5:cba22f48bad9218b64d5bbe0e16afddf', | 
					
						
							|  |  |  |         }, | 
					
						
							|  |  |  |         'playlist_count': 2, | 
					
						
							| 
									
										
										
										
											2017-04-07 21:52:48 +02:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _real_extract(self, url): | 
					
						
							| 
									
										
										
										
											2017-04-08 20:08:31 +07:00
										 |  |  |         article_id = self._match_id(url) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         webpage = self._download_webpage(url, article_id) | 
					
						
							| 
									
										
										
										
											2017-04-07 21:52:48 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-04-08 20:08:31 +07:00
										 |  |  |         entries = [] | 
					
						
							|  |  |  |         for ooyala_id in re.findall( | 
					
						
							|  |  |  |                 r'<[^>]+\b(?:id\s*=\s*"thesun-ooyala-player-|data-content-id\s*=\s*")([^"]+)', | 
					
						
							|  |  |  |                 webpage): | 
					
						
							|  |  |  |             entries.append(OoyalaIE._build_url_result(ooyala_id)) | 
					
						
							| 
									
										
										
										
											2017-04-07 21:52:48 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-04-08 20:08:31 +07:00
										 |  |  |         return self.playlist_result( | 
					
						
							|  |  |  |             entries, article_id, self._og_search_title(webpage, fatal=False)) |