[paramount] Add new extractor

2025-07-12 21:36:19 +00:00 · 2017-09-20 18:09:06 +02:00 · 2017-09-20 18:09:06 +02:00 · 5ec34dc1f3
commit 5ec34dc1f3
parent 3b65a6fbf3
2 changed files with 93 additions and 0 deletions
--- a/youtube_dl/extractor/extractors.py
+++ b/youtube_dl/extractor/extractors.py
@@ -778,6 +778,7 @@ from .packtpub import (
 )
 from .pandatv import PandaTVIE
 from .pandoratv import PandoraTVIE
 from .paramount import ParamountIE
 from .parliamentliveuk import ParliamentLiveUKIE
 from .patreon import PatreonIE
 from .pbs import PBSIE
--- a/youtube_dl/extractor/paramount.py
+++ b/youtube_dl/extractor/paramount.py
@@ -0,0 +1,92 @@
 # coding: utf-8
 # (the encoding declaration must be on the first or second line of the
 # file to take effect; this file contains non-ASCII string literals)
 # youtube_dl extractor for www.paramountchannel.it
 # To install: copy this file to youtube_dl/extractor/
 # and add a line to extractors.py:
 #        from .paramount import ParamountIE
 # The extractor can use the helper methods from common.py, as self._method(...),
 # and can also import from other modules.
 # To test:
 # python -m youtube_dl --verbose "http://www.paramountchannel.it/playlist/speciali-paramount-channel/o3gr12/backstage-sigla-paramount/tqvbxd" >| x
 # python test/test_download.py TestDownload.test_Paramount
 from __future__ import unicode_literals
 from .common import InfoExtractor
 from ..utils import int_or_none
 class ParamountIE(InfoExtractor):
    """Information extractor for video pages of www.paramountchannel.it.

    The page is scraped for the video's long id and its ``mgid`` URI; the
    URI is then used to query the MediaGenerator service hosted on
    akamaihd.net, which answers with an XML list of renditions.
    """

    IE_DESC = 'Paramount Channel'
    _VALID_URL = r'http://(www\.)?paramountchannel\.it/.*/[0-9a-z]{6}'
    _TEST = {
        'url': 'http://www.paramountchannel.it/playlist/speciali-paramount-channel/o3gr12/backstage-sigla-paramount/tqvbxd',
        'md5': '433666e341a57bb76dc50b6ff87e5c63',
        'info_dict': {
            'id': '9cb5ad60-9d34-4a9a-99df-157fdd1a5310',
            'ext': 'mp4',
            'title': 'Speciali video, Paramount Channel',
            'description': 'Tutti gli speciali di Paramount Channel: curiosità, approfondimenti e aggiornamenti su film, serie tv e personaggi del cinema.'
        }
    }

    def _obtain_akamaihd_formats(self, url):
        """Fetch the rendition list at ``url`` and turn it into format dicts.

        The XML document is downloaded exactly once.  In verbose mode the
        raw, unparsed document is additionally echoed to the screen.

        Returns a list of dicts with the keys ``width``, ``height`` and
        ``url``, one per ``./video/item/rendition`` element that carries a
        non-empty ``<src>``.  The list is returned in document order.
        """
        def _show_raw_page(xml_string):
            # Debug aid: print the document as received and hand it on
            # unchanged, so that no second request is needed to display it.
            self.to_screen('formats page = %s' % (xml_string))
            return xml_string

        verbose = self._downloader.params.get('verbose', False)
        listpage = self._download_xml(
            url, 'akamaihd format list',
            transform_source=_show_raw_page if verbose else None)

        formats = []
        for rendition in listpage.findall('./video/item/rendition'):
            src = rendition.find('./src')
            # A rendition without a usable <src> has nothing to download;
            # skip it instead of failing on ``None.text``.
            if src is None or not src.text:
                continue
            formats.append({
                'width': int_or_none(rendition.get('width')),
                'height': int_or_none(rendition.get('height')),
                'url': src.text,
            })
        return formats

    def _real_extract(self, url):
        """Extract id, title, description, thumbnail and formats for ``url``.

        Returns the info dict for the video.  The second id lookup is
        fatal, so extraction fails there when the page exposes neither a
        ``data-mtv-id`` attribute nor an ``item_longId`` entry.
        """
        webpage = self._download_webpage(url, 'webpage')

        # The first pattern is optional because a fallback exists, so
        # default=None is used to avoid a spurious "unable to extract"
        # warning; the fallback lookup itself stays fatal.
        video_id = self._html_search_regex(
            r'data-mtv-id="([0-9a-f-]*)"',
            webpage, 'id', default=None)
        if not video_id:
            video_id = self._html_search_regex(
                r'"item_longId" *: *"([0-9a-f-]*)"',
                webpage, 'id')
        self.to_screen('id = %s' % (video_id))

        # When the page does not state the URI, build it from the id.
        uri = self._html_search_regex(
            r'data-mtv-uri="([0-9a-z:\.-]*)"',
            webpage, 'uri', default=None)
        if not uri:
            uri = 'mgid:arc:video:paramountchannel.it:' + video_id
        self.to_screen('uri = %s' % (uri))

        title = self._og_search_title(webpage)
        self.to_screen('title = %s' % (title))

        # URL of the MediaGenerator document listing the renditions.
        server = 'https://mediautilssvcs-a.akamaihd.net'
        prefix = '/services/MediaGenerator/'
        arguments = 'accountOverride=esperanto.mtvi.com'
        listurl = '%s%s%s?%s' % (server, prefix, uri, arguments)
        self.to_screen('listurl = %s' % (listurl))

        formats = self._obtain_akamaihd_formats(listurl)
        # Format selection expects the list ordered from worst to best;
        # the service's document order is not relied upon.
        self._sort_formats(formats)
        if self._downloader.params.get('verbose', False):
            self.to_screen('formats = %s' % (formats))

        return {
            'id': video_id,
            'formats': formats,
            'title': title,
            'description': self._og_search_description(webpage),
            'thumbnail': self._html_search_meta('thumbnail', webpage, fatal=False)
        }