mirror of
				https://gitlab.com/ytdl-org/youtube-dl.git
				synced 2025-11-04 02:27:11 -05:00 
			
		
		
		
	
		
			
				
	
	
		
			85 lines
		
	
	
		
			2.5 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			85 lines
		
	
	
		
			2.5 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
# encoding: utf-8
 | 
						|
from __future__ import unicode_literals

import base64
import re

from .common import InfoExtractor
from ..utils import (
    ExtractorError,
    struct_unpack,
)
 | 
						|
 | 
						|
 | 
						|
class RTVEALaCartaIE(InfoExtractor):
    """Extractor for video pages of RTVE "a la carta" (rtve.es/alacarta).

    The media URL is not present in the JSON metadata; it is recovered from
    the text chunk of a PNG that the site serves base64-encoded (see
    ``_decrypt_url``).
    """

    IE_NAME = 'rtve.es:alacarta'
    IE_DESC = 'RTVE a la carta'
    _VALID_URL = r'https?://www\.rtve\.es/alacarta/videos/[^/]+/[^/]+/(?P<id>\d+)'

    _TEST = {
        'url': 'http://www.rtve.es/alacarta/videos/balonmano/o-swiss-cup-masculina-final-espana-suecia/2491869/',
        'md5': '1d49b7e1ca7a7502c56a4bf1b60f1b43',
        'info_dict': {
            'id': '2491869',
            'ext': 'mp4',
            'title': 'Balonmano - Swiss Cup masculina. Final: España-Suecia',
        },
    }

    def _decrypt_url(self, png):
        """Recover the media URL hidden in a base64-encoded PNG.

        The payload is read from the chunk tagged ``tEXt``: the four bytes
        before the tag are its big-endian length and the data starts right
        after the tag.  With NUL bytes removed, the data has the form
        ``<alphabet>#<indices>``.

        * Alphabet: a character is kept, then 1, 2, 3, 0, 1, 2, 3, 0, ...
          characters are skipped before the next one is kept.
        * Indices: each URL character is ``alphabet[10 * tens + units]``
          where ``tens`` and ``units`` are decimal digits separated by
          3, 0, 1, 2, 3, 0, ... filler characters.

        ``png`` is the base64 text of the image; the decoded URL is returned
        as a string.  Raises ExtractorError if no usable ``tEXt`` chunk is
        found.
        """
        # Encode first: base64.b64decode() only accepts bytes on Python 3.2.
        encrypted_data = base64.b64decode(png.encode('utf-8'))

        text_index = encrypted_data.find(b'tEXt')
        # The length field occupies the 4 bytes preceding the tag, so an
        # index below 4 (including -1 for "not found") cannot be valid.
        if text_index < 4:
            raise ExtractorError('Unable to find the tEXt chunk in the PNG data')
        text_chunk = encrypted_data[text_index - 4:]
        length = struct_unpack('!I', text_chunk[:4])[0]

        # Use bytearray to get integers when iterating in both python 2.x and 3.x
        payload = bytearray(text_chunk[8:8 + length])
        chars = [chr(byte) for byte in payload if byte != 0]
        hash_index = chars.index('#')
        alphabet_data = chars[:hash_index]
        url_data = chars[hash_index + 1:]

        # Build the alphabet: keep one character, then skip a number of
        # characters that cycles through 1, 2, 3, 0.
        alphabet = []
        skip_cycle = 0
        to_skip = 0
        for char in alphabet_data:
            if to_skip == 0:
                alphabet.append(char)
                to_skip = skip_cycle = (skip_cycle + 1) % 4
            else:
                to_skip -= 1

        # Decode the URL: read a tens digit, skip the filler characters,
        # read the units digit, and look the resulting index up.
        url_chars = []
        have_tens = False
        to_skip = 3
        decoded_count = 1
        index = 0
        for char in url_data:
            if not have_tens:
                index = int(char) * 10
                have_tens = True
            elif to_skip == 0:
                index += int(char)
                url_chars.append(alphabet[index])
                to_skip = (decoded_count + 3) % 4
                have_tens = False
                decoded_count += 1
            else:
                to_skip -= 1

        return ''.join(url_chars)

    def _real_extract(self, url):
        """Return the info dict (id, title, url, thumbnail) for ``url``.

        Metadata comes from the first item of the video's JSON config; the
        media URL is decoded from the PNG fetched for the same video id.
        """
        mobj = re.match(self._VALID_URL, url)
        video_id = mobj.group('id')

        config = self._download_json(
            'http://www.rtve.es/api/videos/%s/config/alacarta_videos.json' % video_id,
            video_id)
        info = config['page']['items'][0]

        png_url = 'http://www.rtve.es/ztnr/movil/thumbnail/default/videos/%s.png' % video_id
        png = self._download_webpage(png_url, video_id, 'Downloading url information')
        video_url = self._decrypt_url(png)

        return {
            'id': video_id,
            'title': info['title'],
            'url': video_url,
            # The thumbnail is optional; do not fail extraction without it.
            'thumbnail': info.get('image'),
        }
 |