| 
									
										
										
										
											2014-09-27 20:21:46 +03:00
										 |  |  | # coding: utf-8 | 
					
						
							|  |  |  | from __future__ import unicode_literals | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | import re | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | from .common import InfoExtractor | 
					
						
							| 
									
										
										
										
											2014-09-28 02:31:14 +07:00
										 |  |  | from ..utils import ExtractorError | 
					
						
							| 
									
										
										
										
											2014-09-27 20:21:46 +03:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class Sport5IE(InfoExtractor): | 
					
						
							| 
									
										
										
										
											2014-09-28 02:31:14 +07:00
										 |  |  |     _VALID_URL = r'http://(?:www|vod)?\.sport5\.co\.il/.*\b(?:Vi|docID)=(?P<id>\d+)' | 
					
						
							|  |  |  |     _TESTS = [ | 
					
						
							|  |  |  |         { | 
					
						
							| 
									
										
										
										
											2014-09-27 20:21:46 +03:00
										 |  |  |             'url': 'http://vod.sport5.co.il/?Vc=147&Vi=176331&Page=1', | 
					
						
							|  |  |  |             'info_dict': { | 
					
						
							|  |  |  |                 'id': 's5-Y59xx1-GUh2', | 
					
						
							|  |  |  |                 'ext': 'mp4', | 
					
						
							| 
									
										
										
										
											2014-09-28 02:31:14 +07:00
										 |  |  |                 'title': 'ולנסיה-קורדובה 0:3', | 
					
						
							|  |  |  |                 'description': 'אלקאסר, גאייה ופגולי סידרו לקבוצה של נונו ניצחון על קורדובה ואת המקום הראשון בליגה', | 
					
						
							|  |  |  |                 'duration': 228, | 
					
						
							|  |  |  |                 'categories': list, | 
					
						
							|  |  |  |             }, | 
					
						
							|  |  |  |             'skip': 'Blocked outside of Israel', | 
					
						
							| 
									
										
										
										
											2014-09-27 20:21:46 +03:00
										 |  |  |         }, { | 
					
						
							|  |  |  |             'url': 'http://www.sport5.co.il/articles.aspx?FolderID=3075&docID=176372&lang=HE', | 
					
						
							|  |  |  |             'info_dict': { | 
					
						
							|  |  |  |                 'id': 's5-SiXxx1-hKh2', | 
					
						
							|  |  |  |                 'ext': 'mp4', | 
					
						
							| 
									
										
										
										
											2014-09-28 02:31:14 +07:00
										 |  |  |                 'title': 'GOALS_CELTIC_270914.mp4', | 
					
						
							|  |  |  |                 'description': '', | 
					
						
							|  |  |  |                 'duration': 87, | 
					
						
							|  |  |  |                 'categories': list, | 
					
						
							|  |  |  |             }, | 
					
						
							|  |  |  |             'skip': 'Blocked outside of Israel', | 
					
						
							| 
									
										
										
										
											2014-09-27 20:21:46 +03:00
										 |  |  |         } | 
					
						
							|  |  |  |     ] | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _real_extract(self, url): | 
					
						
							|  |  |  |         mobj = re.match(self._VALID_URL, url) | 
					
						
							| 
									
										
										
										
											2014-09-28 02:31:14 +07:00
										 |  |  |         media_id = mobj.group('id') | 
					
						
							| 
									
										
										
										
											2014-09-27 20:21:46 +03:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-09-28 02:31:14 +07:00
										 |  |  |         webpage = self._download_webpage(url, media_id) | 
					
						
							| 
									
										
										
										
											2014-09-27 20:21:46 +03:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-09-28 02:31:14 +07:00
										 |  |  |         video_id = self._html_search_regex('clipId=([\w-]+)', webpage, 'video id') | 
					
						
							| 
									
										
										
										
											2014-09-27 20:21:46 +03:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-09-28 02:31:14 +07:00
										 |  |  |         metadata = self._download_xml( | 
					
						
							|  |  |  |             'http://sport5-metadata-rr-d.nsacdn.com/vod/vod/%s/HDS/metadata.xml' % video_id, | 
					
						
							|  |  |  |             video_id) | 
					
						
							| 
									
										
										
										
											2014-09-27 20:21:46 +03:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-09-28 02:31:14 +07:00
										 |  |  |         error = metadata.find('./Error') | 
					
						
							|  |  |  |         if error is not None: | 
					
						
							|  |  |  |             raise ExtractorError( | 
					
						
							|  |  |  |                 '%s returned error: %s - %s' % ( | 
					
						
							|  |  |  |                     self.IE_NAME, | 
					
						
							|  |  |  |                     error.find('./Name').text, | 
					
						
							|  |  |  |                     error.find('./Description').text), | 
					
						
							|  |  |  |                 expected=True) | 
					
						
							| 
									
										
										
										
											2014-09-27 20:21:46 +03:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-09-28 02:31:14 +07:00
										 |  |  |         title = metadata.find('./Title').text | 
					
						
							|  |  |  |         description = metadata.find('./Description').text | 
					
						
							|  |  |  |         duration = int(metadata.find('./Duration').text) | 
					
						
							| 
									
										
										
										
											2014-09-27 20:21:46 +03:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-09-28 02:31:14 +07:00
										 |  |  |         posters_el = metadata.find('./PosterLinks') | 
					
						
							|  |  |  |         thumbnails = [{ | 
					
						
							|  |  |  |             'url': thumbnail.text, | 
					
						
							|  |  |  |             'width': int(thumbnail.get('width')), | 
					
						
							|  |  |  |             'height': int(thumbnail.get('height')), | 
					
						
							|  |  |  |         } for thumbnail in posters_el.findall('./PosterIMG')] if posters_el is not None else [] | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         categories_el = metadata.find('./Categories') | 
					
						
							|  |  |  |         categories = [ | 
					
						
							|  |  |  |             cat.get('name') for cat in categories_el.findall('./Category') | 
					
						
							|  |  |  |         ] if categories_el is not None else [] | 
					
						
							| 
									
										
										
										
											2014-09-27 20:21:46 +03:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-09-28 02:31:14 +07:00
										 |  |  |         formats = [{ | 
					
						
							|  |  |  |             'url': fmt.text, | 
					
						
							|  |  |  |             'ext': 'mp4', | 
					
						
							|  |  |  |             'vbr': int(fmt.get('bitrate')), | 
					
						
							|  |  |  |             'width': int(fmt.get('width')), | 
					
						
							|  |  |  |             'height': int(fmt.get('height')), | 
					
						
							|  |  |  |         } for fmt in metadata.findall('./PlaybackLinks/FileURL')] | 
					
						
							| 
									
										
										
										
											2014-09-27 20:21:46 +03:00
										 |  |  |         self._sort_formats(formats) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         return { | 
					
						
							| 
									
										
										
										
											2014-09-28 02:31:14 +07:00
										 |  |  |             'id': video_id, | 
					
						
							| 
									
										
										
										
											2014-09-27 20:21:46 +03:00
										 |  |  |             'title': title, | 
					
						
							| 
									
										
										
										
											2014-09-28 02:31:14 +07:00
										 |  |  |             'description': description, | 
					
						
							|  |  |  |             'thumbnails': thumbnails, | 
					
						
							| 
									
										
										
										
											2014-09-27 20:21:46 +03:00
										 |  |  |             'duration': duration, | 
					
						
							| 
									
										
										
										
											2014-09-28 02:31:14 +07:00
										 |  |  |             'categories': categories, | 
					
						
							| 
									
										
										
										
											2014-09-27 20:21:46 +03:00
										 |  |  |             'formats': formats, | 
					
						
							|  |  |  |         } |