| 
									
										
										
										
											2014-10-27 02:26:05 +01:00
										 |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-09-16 14:45:14 +02:00
										 |  |  | from .common import InfoExtractor | 
					
						
							|  |  |  | from ..utils import ( | 
					
						
							| 
									
										
										
										
											2013-09-18 23:32:37 +02:00
										 |  |  |     clean_html, | 
					
						
							| 
									
										
										
										
											2015-09-09 10:42:47 +01:00
										 |  |  |     determine_ext, | 
					
						
							| 
									
										
										
										
											2015-12-19 18:26:28 +01:00
										 |  |  |     js_to_json, | 
					
						
							| 
									
										
										
										
											2013-09-16 14:45:14 +02:00
										 |  |  | ) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-09-18 23:32:37 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-09-16 14:45:14 +02:00
										 |  |  | class FKTVIE(InfoExtractor): | 
					
						
							| 
									
										
										
										
											2014-10-27 02:26:05 +01:00
										 |  |  |     IE_NAME = 'fernsehkritik.tv' | 
					
						
							| 
									
										
										
										
											2016-03-21 21:36:32 +06:00
										 |  |  |     _VALID_URL = r'https?://(?:www\.)?fernsehkritik\.tv/folge-(?P<id>[0-9]+)(?:/.*)?' | 
					
						
							| 
									
										
										
										
											2013-09-16 14:45:14 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-09-18 23:32:37 +02:00
										 |  |  |     _TEST = { | 
					
						
							| 
									
										
										
										
											2014-10-27 02:26:05 +01:00
										 |  |  |         'url': 'http://fernsehkritik.tv/folge-1', | 
					
						
							| 
									
										
										
										
											2015-09-09 10:42:47 +01:00
										 |  |  |         'md5': '21f0b0c99bce7d5b524eb1b17b1c6d79', | 
					
						
							| 
									
										
										
										
											2014-10-27 02:26:05 +01:00
										 |  |  |         'info_dict': { | 
					
						
							| 
									
										
										
										
											2015-09-09 10:42:47 +01:00
										 |  |  |             'id': '1', | 
					
						
							|  |  |  |             'ext': 'mp4', | 
					
						
							| 
									
										
										
										
											2014-10-27 02:26:05 +01:00
										 |  |  |             'title': 'Folge 1 vom 10. April 2007', | 
					
						
							| 
									
										
										
										
											2015-09-25 17:58:44 +08:00
										 |  |  |             'thumbnail': 're:^https?://.*\.jpg$', | 
					
						
							| 
									
										
										
										
											2013-09-18 23:32:37 +02:00
										 |  |  |         }, | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _real_extract(self, url): | 
					
						
							| 
									
										
										
										
											2015-09-09 10:42:47 +01:00
										 |  |  |         episode = self._match_id(url) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-09-25 18:01:08 +08:00
										 |  |  |         webpage = self._download_webpage( | 
					
						
							|  |  |  |             'http://fernsehkritik.tv/folge-%s/play' % episode, episode) | 
					
						
							|  |  |  |         title = clean_html(self._html_search_regex( | 
					
						
							|  |  |  |             '<h3>([^<]+)</h3>', webpage, 'title')) | 
					
						
							| 
									
										
										
										
											2015-12-19 18:26:28 +01:00
										 |  |  |         thumbnail = self._search_regex(r'POSTER\s*=\s*"([^"]+)', webpage, 'thumbnail', fatal=False) | 
					
						
							|  |  |  |         sources = self._parse_json(self._search_regex(r'(?s)MEDIA\s*=\s*(\[.+?\]);', webpage, 'media'), episode, js_to_json) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         formats = [] | 
					
						
							|  |  |  |         for source in sources: | 
					
						
							|  |  |  |             furl = source.get('src') | 
					
						
							|  |  |  |             if furl: | 
					
						
							|  |  |  |                 formats.append({ | 
					
						
							|  |  |  |                     'url': furl, | 
					
						
							|  |  |  |                     'format_id': determine_ext(furl), | 
					
						
							|  |  |  |                 }) | 
					
						
							|  |  |  |         self._sort_formats(formats) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-09-25 17:48:51 +08:00
										 |  |  |         return { | 
					
						
							|  |  |  |             'id': episode, | 
					
						
							|  |  |  |             'title': title, | 
					
						
							|  |  |  |             'formats': formats, | 
					
						
							| 
									
										
										
										
											2015-12-19 18:26:28 +01:00
										 |  |  |             'thumbnail': thumbnail, | 
					
						
							| 
									
										
										
										
											2015-09-25 17:48:51 +08:00
										 |  |  |         } |