mirror of
				https://gitlab.com/ytdl-org/youtube-dl.git
				synced 2025-11-04 01:37:07 -05:00 
			
		
		
		
	It uses a helper method in the InfoExtractor class. The downloader will pick the requested formats using the bitrate in the info dict.
		
			
				
	
	
		
			38 lines
		
	
	
		
			1.2 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			38 lines
		
	
	
		
			1.2 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
from __future__ import unicode_literals
 | 
						|
 | 
						|
import re
 | 
						|
 | 
						|
from .common import InfoExtractor
 | 
						|
 | 
						|
 | 
						|
class BloombergIE(InfoExtractor):
 | 
						|
    _VALID_URL = r'https?://www\.bloomberg\.com/video/(?P<name>.+?)\.html'
 | 
						|
 | 
						|
    _TEST = {
 | 
						|
        'url': 'http://www.bloomberg.com/video/shah-s-presentation-on-foreign-exchange-strategies-qurhIVlJSB6hzkVi229d8g.html',
 | 
						|
        # The md5 checksum changes
 | 
						|
        'info_dict': {
 | 
						|
            'id': 'qurhIVlJSB6hzkVi229d8g',
 | 
						|
            'ext': 'flv',
 | 
						|
            'title': 'Shah\'s Presentation on Foreign-Exchange Strategies',
 | 
						|
            'description': 'md5:0681e0d30dcdfc6abf34594961d8ea88',
 | 
						|
        },
 | 
						|
    }
 | 
						|
 | 
						|
    def _real_extract(self, url):
 | 
						|
        mobj = re.match(self._VALID_URL, url)
 | 
						|
        name = mobj.group('name')
 | 
						|
        webpage = self._download_webpage(url, name)
 | 
						|
        f4m_url = self._search_regex(
 | 
						|
            r'<source src="(https?://[^"]+\.f4m.*?)"', webpage,
 | 
						|
            'f4m url')
 | 
						|
        title = re.sub(': Video$', '', self._og_search_title(webpage))
 | 
						|
 | 
						|
        return {
 | 
						|
            'id': name.split('-')[-1],
 | 
						|
            'title': title,
 | 
						|
            'formats': self._extract_f4m_formats(f4m_url, name),
 | 
						|
            'description': self._og_search_description(webpage),
 | 
						|
            'thumbnail': self._og_search_thumbnail(webpage),
 | 
						|
        }
 |