85 lines
		
	
	
		
			2.5 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
		
		
			
		
	
	
			85 lines
		
	
	
		
			2.5 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| 
								 | 
							
								# encoding: utf-8
							 | 
						||
| 
								 | 
							
								from __future__ import unicode_literals
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								import re
							 | 
						||
| 
								 | 
							
								import base64
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								from .common import InfoExtractor
							 | 
						||
| 
								 | 
							
								from ..utils import (
							 | 
						||
| 
								 | 
							
								    struct_unpack,
							 | 
						||
| 
								 | 
							
								)
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								class RTVEALaCartaIE(InfoExtractor):
							 | 
						||
| 
								 | 
							
								    IE_NAME = 'rtve.es:alacarta'
							 | 
						||
| 
								 | 
							
								    IE_DESC = 'RTVE a la carta'
							 | 
						||
| 
								 | 
							
								    _VALID_URL = r'http://www\.rtve\.es/alacarta/videos/[^/]+/[^/]+/(?P<id>\d+)'
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    _TEST = {
							 | 
						||
| 
								 | 
							
								        'url': 'http://www.rtve.es/alacarta/videos/balonmano/o-swiss-cup-masculina-final-espana-suecia/2491869/',
							 | 
						||
| 
								 | 
							
								        'md5': '18fcd45965bdd076efdb12cd7f6d7b9e',
							 | 
						||
| 
								 | 
							
								        'info_dict': {
							 | 
						||
| 
								 | 
							
								            'id': '2491869',
							 | 
						||
| 
								 | 
							
								            'ext': 'mp4',
							 | 
						||
| 
								 | 
							
								            'title': 'Balonmano - Swiss Cup masculina. Final: España-Suecia',
							 | 
						||
| 
								 | 
							
								        },
							 | 
						||
| 
								 | 
							
								    }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    def _decrypt_url(self, png):
							 | 
						||
| 
								 | 
							
								        encrypted_data = base64.b64decode(png)
							 | 
						||
| 
								 | 
							
								        text_index = encrypted_data.find(b'tEXt')
							 | 
						||
| 
								 | 
							
								        text_chunk = encrypted_data[text_index-4:]
							 | 
						||
| 
								 | 
							
								        length = struct_unpack('!I', text_chunk[:4])[0]
							 | 
						||
| 
								 | 
							
								        # Use bytearray to get integers when iterating in both python 2.x and 3.x
							 | 
						||
| 
								 | 
							
								        data = bytearray(text_chunk[8:8+length])
							 | 
						||
| 
								 | 
							
								        data = [chr(b) for b in data if b != 0]
							 | 
						||
| 
								 | 
							
								        hash_index = data.index('#')
							 | 
						||
| 
								 | 
							
								        alphabet_data = data[:hash_index]
							 | 
						||
| 
								 | 
							
								        url_data = data[hash_index+1:]
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								        alphabet = []
							 | 
						||
| 
								 | 
							
								        e = 0
							 | 
						||
| 
								 | 
							
								        d = 0
							 | 
						||
| 
								 | 
							
								        for l in alphabet_data:
							 | 
						||
| 
								 | 
							
								            if d == 0:
							 | 
						||
| 
								 | 
							
								                alphabet.append(l)
							 | 
						||
| 
								 | 
							
								                d = e = (e + 1) % 4
							 | 
						||
| 
								 | 
							
								            else:
							 | 
						||
| 
								 | 
							
								                d -= 1
							 | 
						||
| 
								 | 
							
								        url = ''
							 | 
						||
| 
								 | 
							
								        f = 0
							 | 
						||
| 
								 | 
							
								        e = 3
							 | 
						||
| 
								 | 
							
								        b = 1
							 | 
						||
| 
								 | 
							
								        for letter in url_data:
							 | 
						||
| 
								 | 
							
								            if f == 0:
							 | 
						||
| 
								 | 
							
								                l = int(letter)*10
							 | 
						||
| 
								 | 
							
								                f = 1
							 | 
						||
| 
								 | 
							
								            else:
							 | 
						||
| 
								 | 
							
								                if e == 0:
							 | 
						||
| 
								 | 
							
								                    l += int(letter)
							 | 
						||
| 
								 | 
							
								                    url += alphabet[l]
							 | 
						||
| 
								 | 
							
								                    e = (b + 3) % 4
							 | 
						||
| 
								 | 
							
								                    f = 0
							 | 
						||
| 
								 | 
							
								                    b += 1
							 | 
						||
| 
								 | 
							
								                else:
							 | 
						||
| 
								 | 
							
								                    e -= 1
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								        return url
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    def _real_extract(self, url):
							 | 
						||
| 
								 | 
							
								        mobj = re.match(self._VALID_URL, url)
							 | 
						||
| 
								 | 
							
								        video_id = mobj.group('id')
							 | 
						||
| 
								 | 
							
								        info = self._download_json(
							 | 
						||
| 
								 | 
							
								            'http://www.rtve.es/api/videos/%s/config/alacarta_videos.json' % video_id,
							 | 
						||
| 
								 | 
							
								            video_id)['page']['items'][0]
							 | 
						||
| 
								 | 
							
								        png_url = 'http://www.rtve.es/ztnr/movil/thumbnail/default/videos/%s.png' % video_id
							 | 
						||
| 
								 | 
							
								        png = self._download_webpage(png_url, video_id, 'Downloading url information')
							 | 
						||
| 
								 | 
							
								        video_url = self._decrypt_url(png)
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								        return {
							 | 
						||
| 
								 | 
							
								            'id': video_id,
							 | 
						||
| 
								 | 
							
								            'title': info['title'],
							 | 
						||
| 
								 | 
							
								            'url': video_url,
							 | 
						||
| 
								 | 
							
								            'thumbnail': info['image'],
							 | 
						||
| 
								 | 
							
								        }
							 |