[paramount] Add new extractor

2025-07-12 21:36:19 +00:00 · 2017-09-20 18:09:06 +02:00 · 2017-09-20 18:09:06 +02:00 · 5ec34dc1f3
commit 5ec34dc1f3
parent 3b65a6fbf3
2 changed files with 93 additions and 0 deletions
--- a/youtube_dl/extractor/extractors.py
+++ b/youtube_dl/extractor/extractors.py
@ -778,6 +778,7 @@ from .packtpub import (
 )
 from .pandatv import PandaTVIE
 from .pandoratv import PandoraTVIE
+from .paramount import ParamountIE
 from .parliamentliveuk import ParliamentLiveUKIE
 from .patreon import PatreonIE
 from .pbs import PBSIE
--- a/youtube_dl/extractor/paramount.py
+++ b/youtube_dl/extractor/paramount.py
@ -0,0 +1,92 @@
+# youtube_dl extractor for www.paramountchannel.it
+
+# copy to youtube_dl/extractors
+# add a line to extractors.py:
+#        from .paramount import ParamountIE
+
+# can use functions from common.py, as _self.function(...)
+# also import from other modules
+
+# to test:
+# python -m youtube_dl --verbose "http://www.paramountchannel.it/playlist/speciali-paramount-channel/o3gr12/backstage-sigla-paramount/tqvbxd" >| x
+# python test/test_download.py TestDownload.test_Paramount
+
+# coding: utf-8
+from __future__ import unicode_literals
+
+from .common import InfoExtractor
+from ..utils import int_or_none
+
+
+class ParamountIE(InfoExtractor):
+    IE_DESC = 'Paramount Channel'
+    _VALID_URL = r'http://(www\.)?paramountchannel\.it/.*/[0-9a-z]{6}'
+
+    _TEST = {
+        'url': 'http://www.paramountchannel.it/playlist/speciali-paramount-channel/o3gr12/backstage-sigla-paramount/tqvbxd',
+        'md5': '433666e341a57bb76dc50b6ff87e5c63',
+        'info_dict': {
+            'id': '9cb5ad60-9d34-4a9a-99df-157fdd1a5310',
+            'ext': 'mp4',
+            'title': 'Speciali video, Paramount Channel',
+            'description': 'Tutti gli speciali di Paramount Channel: curiosità, approfondimenti e aggiornamenti su film, serie tv e personaggi del cinema.'
+        }
+    }
+
+    def _obtain_akamaihd_formats(self, url):
+        if self._downloader.params.get('verbose', False):
+            listpage = self._download_webpage(url, 'akamaihd format list')
+            self.to_screen('formats page = %s' % (listpage))
+        listpage = self._download_xml(url, 'akamaihd format list')
+        formats = []
+        for rendition in listpage.findall('./video/item/rendition'):
+            fmt = {
+                'width': int_or_none(rendition.get('width')),
+                'height': int_or_none(rendition.get('height')),
+                'url': rendition.find('./src').text
+            }
+            formats.append(fmt)
+        return formats
+
+    def _real_extract(self, url):
+        # webpage
+
+        webpage = self._download_webpage(url, 'webpage')
+
+        id = self._html_search_regex(
+            r'data-mtv-id="([0-9a-f-]*)"',
+            webpage, 'id', fatal=False) \
+            or \
+            self._html_search_regex(
+            r'"item_longId" *: *"([0-9a-f-]*)"',
+            webpage, 'id')
+        self.to_screen('id = %s' % (id))
+
+        uri = self._html_search_regex(
+            r'data-mtv-uri="([0-9a-z:\.-]*)"',
+            webpage, 'uri', fatal=False) \
+            or \
+            'mgid:arc:video:paramountchannel.it:' + id
+        self.to_screen('uri = %s' % (uri))
+
+        title = self._og_search_title(webpage)
+        self.to_screen('title = %s' % (title))
+
+        # list of formats
+
+        server = 'https://mediautilssvcs-a.akamaihd.net'
+        prefix = '/services/MediaGenerator/'
+        arguments = 'accountOverride=esperanto.mtvi.com'
+        listurl = '%s%s%s?%s' % (server, prefix, uri, arguments)
+        self.to_screen('listurl = %s' % (listurl))
+        formats = self._obtain_akamaihd_formats(listurl)
+        if self._downloader.params.get('verbose', False):
+            self.to_screen('formats = %s' % (formats))
+
+        return {
+            'id': id,
+            'formats': formats,
+            'title': title,
+            'description': self._og_search_description(webpage),
+            'thumbnail': self._html_search_meta('thumbnail', webpage, fatal=False)
+        }