| 
									
										
										
										
											2014-10-01 23:45:35 +03:00
										 |  |  | # coding: utf-8 | 
					
						
							|  |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | import re | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-02-17 21:23:09 +01:00
										 |  |  | from .common import InfoExtractor | 
					
						
							| 
									
										
										
										
											2014-10-07 22:23:05 +07:00
										 |  |  | from ..utils import ( | 
					
						
							|  |  |  |     xpath_text, | 
					
						
							|  |  |  |     int_or_none, | 
					
						
							|  |  |  | ) | 
					
						
							| 
									
										
										
										
											2014-10-01 23:45:35 +03:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-02-17 21:23:09 +01:00
										 |  |  | class WallaIE(InfoExtractor): | 
					
						
							| 
									
										
										
										
											2014-10-07 22:23:05 +07:00
										 |  |  |     _VALID_URL = r'http://vod\.walla\.co\.il/[^/]+/(?P<id>\d+)/(?P<display_id>.+)' | 
					
						
							| 
									
										
										
										
											2014-10-01 23:45:35 +03:00
										 |  |  |     _TEST = { | 
					
						
							|  |  |  |         'url': 'http://vod.walla.co.il/movie/2642630/one-direction-all-for-one', | 
					
						
							|  |  |  |         'info_dict': { | 
					
						
							|  |  |  |             'id': '2642630', | 
					
						
							| 
									
										
										
										
											2014-10-07 22:23:05 +07:00
										 |  |  |             'display_id': 'one-direction-all-for-one', | 
					
						
							| 
									
										
										
										
											2014-10-01 23:45:35 +03:00
										 |  |  |             'ext': 'flv', | 
					
						
							|  |  |  |             'title': 'וואן דיירקשן: ההיסטריה', | 
					
						
							| 
									
										
										
										
											2014-10-07 22:23:05 +07:00
										 |  |  |             'description': 'md5:de9e2512a92442574cdb0913c49bc4d8', | 
					
						
							|  |  |  |             'thumbnail': 're:^https?://.*\.jpg', | 
					
						
							|  |  |  |             'duration': 3600, | 
					
						
							|  |  |  |         }, | 
					
						
							|  |  |  |         'params': { | 
					
						
							|  |  |  |             # rtmp download | 
					
						
							|  |  |  |             'skip_download': True, | 
					
						
							| 
									
										
										
										
											2014-10-01 23:45:35 +03:00
										 |  |  |         } | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-10-07 22:23:05 +07:00
										 |  |  |     _SUBTITLE_LANGS = { | 
					
						
							|  |  |  |         'עברית': 'heb', | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-10-01 23:45:35 +03:00
										 |  |  |     def _real_extract(self, url): | 
					
						
							|  |  |  |         mobj = re.match(self._VALID_URL, url) | 
					
						
							|  |  |  |         video_id = mobj.group('id') | 
					
						
							| 
									
										
										
										
											2014-10-07 22:23:05 +07:00
										 |  |  |         display_id = mobj.group('display_id') | 
					
						
							| 
									
										
										
										
											2014-10-01 23:45:35 +03:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-10-07 22:23:05 +07:00
										 |  |  |         video = self._download_xml( | 
					
						
							|  |  |  |             'http://video2.walla.co.il/?w=null/null/%s/@@/video/flv_pl' % video_id, | 
					
						
							|  |  |  |             display_id) | 
					
						
							| 
									
										
										
										
											2014-10-01 23:45:35 +03:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-10-07 22:23:05 +07:00
										 |  |  |         item = video.find('./items/item') | 
					
						
							| 
									
										
										
										
											2014-10-01 23:45:35 +03:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-10-07 22:23:05 +07:00
										 |  |  |         title = xpath_text(item, './title', 'title') | 
					
						
							|  |  |  |         description = xpath_text(item, './synopsis', 'description') | 
					
						
							|  |  |  |         thumbnail = xpath_text(item, './preview_pic', 'thumbnail') | 
					
						
							|  |  |  |         duration = int_or_none(xpath_text(item, './duration', 'duration')) | 
					
						
							| 
									
										
										
										
											2014-10-01 23:45:35 +03:00
										 |  |  | 
 | 
					
						
							|  |  |  |         subtitles = {} | 
					
						
							| 
									
										
										
										
											2014-10-07 22:23:05 +07:00
										 |  |  |         for subtitle in item.findall('./subtitles/subtitle'): | 
					
						
							|  |  |  |             lang = xpath_text(subtitle, './title') | 
					
						
							| 
									
										
										
										
											2015-02-17 21:23:09 +01:00
										 |  |  |             subtitles[self._SUBTITLE_LANGS.get(lang, lang)] = [{ | 
					
						
							|  |  |  |                 'ext': 'srt', | 
					
						
							|  |  |  |                 'url': xpath_text(subtitle, './src'), | 
					
						
							|  |  |  |             }] | 
					
						
							| 
									
										
										
										
											2014-10-07 22:23:05 +07:00
										 |  |  | 
 | 
					
						
							|  |  |  |         formats = [] | 
					
						
							|  |  |  |         for quality in item.findall('./qualities/quality'): | 
					
						
							|  |  |  |             format_id = xpath_text(quality, './title') | 
					
						
							|  |  |  |             fmt = { | 
					
						
							|  |  |  |                 'url': 'rtmp://wafla.walla.co.il/vod', | 
					
						
							|  |  |  |                 'play_path': xpath_text(quality, './src'), | 
					
						
							|  |  |  |                 'player_url': 'http://isc.walla.co.il/w9/swf/video_swf/vod/WallaMediaPlayerAvod.swf', | 
					
						
							|  |  |  |                 'page_url': url, | 
					
						
							|  |  |  |                 'ext': 'flv', | 
					
						
							|  |  |  |                 'format_id': xpath_text(quality, './title'), | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  |             m = re.search(r'^(?P<height>\d+)[Pp]', format_id) | 
					
						
							|  |  |  |             if m: | 
					
						
							|  |  |  |                 fmt['height'] = int(m.group('height')) | 
					
						
							|  |  |  |             formats.append(fmt) | 
					
						
							|  |  |  |         self._sort_formats(formats) | 
					
						
							| 
									
										
										
										
											2014-10-01 23:45:35 +03:00
										 |  |  | 
 | 
					
						
							|  |  |  |         return { | 
					
						
							|  |  |  |             'id': video_id, | 
					
						
							| 
									
										
										
										
											2014-10-07 22:23:05 +07:00
										 |  |  |             'display_id': display_id, | 
					
						
							| 
									
										
										
										
											2014-10-01 23:45:35 +03:00
										 |  |  |             'title': title, | 
					
						
							| 
									
										
										
										
											2014-10-07 22:23:05 +07:00
										 |  |  |             'description': description, | 
					
						
							|  |  |  |             'thumbnail': thumbnail, | 
					
						
							|  |  |  |             'duration': duration, | 
					
						
							|  |  |  |             'formats': formats, | 
					
						
							| 
									
										
										
										
											2014-10-01 23:45:35 +03:00
										 |  |  |             'subtitles': subtitles, | 
					
						
							| 
									
										
										
										
											2014-10-07 22:23:05 +07:00
										 |  |  |         } |