mirror of
				https://github.com/ytdl-org/youtube-dl
				synced 2025-11-03 19:23:44 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			75 lines
		
	
	
		
			3.0 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			75 lines
		
	
	
		
			3.0 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
# coding: utf-8
 | 
						||
from __future__ import unicode_literals
 | 
						||
 | 
						||
from .common import InfoExtractor
 | 
						||
from ..compat import compat_str
 | 
						||
from ..utils import (
 | 
						||
    ExtractorError,
 | 
						||
    traverse_obj,
 | 
						||
    try_get,
 | 
						||
)
 | 
						||
 | 
						||
 | 
						||
class CallinIE(InfoExtractor):
    """Extractor for single episodes hosted on callin.com.

    The episode page embeds its metadata as Next.js page data
    (a ``__NEXT_DATA__`` script tag); the media itself is read from the
    ``m3u8`` entry of that metadata.
    """

    # The episode id is the last dash-separated token of the URL slug.
    _VALID_URL = r'https?://(?:www\.)?callin\.com/episode/(?:[^/#?-]+-)*(?P<id>[^/#?-]+)'
    _TESTS = [{
        'url': 'https://www.callin.com/episode/fcc-commissioner-brendan-carr-on-elons-PrumRdSQJW',
        'md5': '14ede27ee2c957b7e4db93140fc0745c',
        'info_dict': {
            'id': 'PrumRdSQJW',
            'ext': 'mp4',
            'title': 'FCC Commissioner Brendan Carr on Elon’s Starlink',
            'description': 'Or, why the government doesn’t like SpaceX',
            'channel': 'The Pull Request',
            'channel_url': 'https://callin.com/show/the-pull-request-ucnDJmEKAa',
        }
    }, {
        'url': 'https://www.callin.com/episode/episode-81-elites-melt-down-over-student-debt-lzxMidUnjA',
        'md5': '16f704ddbf82a27e3930533b12062f07',
        'info_dict': {
            'id': 'lzxMidUnjA',
            'ext': 'mp4',
            'title': 'Episode 81- Elites MELT DOWN over Student Debt Victory? Rumble in NYC?',
            'description': 'Let’s talk todays episode about the primary election shake up in NYC and the elites melting down over student debt cancelation.',
            'channel': 'The DEBRIEF With Briahna Joy Gray',
            'channel_url': 'https://callin.com/show/the-debrief-with-briahna-joy-gray-siiFDzGegm',
        }
    }]

    def _search_nextjs_data(self, webpage, video_id, transform_source=None, fatal=True, **kw):
        """Locate and decode the ``__NEXT_DATA__`` JSON blob of a page.

        webpage          -- HTML text to search
        video_id         -- id used for error/warning reporting
        transform_source -- optional callable applied to the raw JSON text
                            before it is parsed
        fatal            -- when true, a missing or malformed blob is an
                            error; otherwise None is returned
        Remaining keyword arguments are forwarded to _search_regex().
        """
        json_text = self._search_regex(
            r'(?s)<script[^>]+id=[\'"]__NEXT_DATA__[\'"][^>]*>([^<]+)</script>',
            webpage, 'next.js data', fatal=fatal, **kw)
        if json_text is None:
            # Non-fatal search found nothing: there is no text to parse, so
            # do not hand None to the JSON parser.
            return None
        return self._parse_json(
            json_text, video_id, transform_source=transform_source, fatal=fatal)

    def _real_extract(self, url):
        """Build the info dict for the episode page at *url*.

        Raises ExtractorError when the page data contains no episode
        object.
        """
        video_id = self._match_id(url)
        webpage = self._download_webpage(url, video_id)

        next_data = self._search_nextjs_data(webpage, video_id)
        episode = traverse_obj(next_data, ('props', 'pageProps', 'episode'), expected_type=dict)
        if not episode:
            raise ExtractorError('Failed to find episode data')

        # Prefer the structured metadata; fall back to OpenGraph tags.
        title = episode.get('title') or self._og_search_title(webpage)
        description = episode.get('description') or self._og_search_description(webpage)

        formats = []
        # Only request the manifest when the episode actually carries a
        # string URL for it; otherwise leave `formats` empty so that
        # _sort_formats() reports the missing formats.
        m3u8_url = try_get(episode, lambda x: x['m3u8'], compat_str)
        if m3u8_url:
            formats.extend(self._extract_m3u8_formats(
                m3u8_url, video_id, 'mp4',
                entry_protocol='m3u8_native', fatal=False))
        self._sort_formats(formats)

        channel = try_get(episode, lambda x: x['show']['title'], compat_str)
        channel_url = try_get(episode, lambda x: x['show']['linkObj']['resourceUrl'], compat_str)

        return {
            'id': video_id,
            'title': title,
            'description': description,
            'formats': formats,
            'channel': channel,
            'channel_url': channel_url,
        }
 |