youtube-dl/youtube_dl/extractor/adultswim.py

# coding: utf-8
from __future__ import unicode_literals

import re

from .turner import TurnerBaseIE
from ..utils import (
    int_or_none,
    strip_or_none,
)


class AdultSwimIE(TurnerBaseIE):
    """Extractor for adultswim.com video, show and stream pages.

    Handled URLs have the form ``/videos/<show_path>[/<episode_path>]``:

    * ``<show_path>/<episode_path>`` -- a single video;
    * ``<show_path>`` alone -- a playlist of the show's videos;
    * ``streams[/<episode_path>]`` -- a stream, or a playlist of its
      archived episodes when the stream entry has no ``stream`` id.
    """

    _VALID_URL = r'https?://(?:www\.)?adultswim\.com/videos/(?P<show_path>[^/?#]+)(?:/(?P<episode_path>[^/?#]+))?'

    _TESTS = [{
        'url': 'http://adultswim.com/videos/rick-and-morty/pilot',
        'info_dict': {
            'id': 'rQxZvXQ4ROaSOqq-or2Mow',
            'ext': 'mp4',
            'title': 'Rick and Morty - Pilot',
            'description': 'Rick moves in with his daughter\'s family and establishes himself as a bad influence on his grandson, Morty.',
            'timestamp': 1493267400,
            'upload_date': '20170427',
        },
        'params': {
            # m3u8 download
            'skip_download': True,
        },
        'expected_warnings': ['Unable to download f4m manifest'],
    }, {
        'url': 'http://www.adultswim.com/videos/tim-and-eric-awesome-show-great-job/dr-steve-brule-for-your-wine/',
        'info_dict': {
            'id': 'sY3cMUR_TbuE4YmdjzbIcQ',
            'ext': 'mp4',
            'title': 'Tim and Eric Awesome Show Great Job! - Dr. Steve Brule, For Your Wine',
            'description': 'Dr. Brule reports live from Wine Country with a special report on wines.  \nWatch Tim and Eric Awesome Show Great Job! episode #20, "Embarrassed" on Adult Swim.',
            'upload_date': '20080124',
            'timestamp': 1201150800,
        },
        'params': {
            # m3u8 download
            'skip_download': True,
        },
    }, {
        'url': 'http://www.adultswim.com/videos/decker/inside-decker-a-new-hero/',
        'info_dict': {
            'id': 'I0LQFQkaSUaFp8PnAWHhoQ',
            'ext': 'mp4',
            'title': 'Decker - Inside Decker: A New Hero',
            'description': 'The guys recap the conclusion of the season. They announce a new hero, take a peek into the Victorville Film Archive and welcome back the talented James Dean.',
            'timestamp': 1469480460,
            'upload_date': '20160725',
        },
        'params': {
            # m3u8 download
            'skip_download': True,
        },
        'expected_warnings': ['Unable to download f4m manifest'],
    }, {
        'url': 'http://www.adultswim.com/videos/attack-on-titan',
        'info_dict': {
            'id': 'b7A69dzfRzuaXIECdxW8XQ',
            'title': 'Attack on Titan',
            'description': 'md5:6c8e003ea0777b47013e894767f5e114',
        },
        'playlist_mincount': 12,
    }, {
        'url': 'http://www.adultswim.com/videos/streams/williams-stream',
        'info_dict': {
            'id': 'd8DEBj7QRfetLsRgFnGEyg',
            'ext': 'mp4',
            'title': r're:^Williams Stream \d{4}-\d{2}-\d{2} \d{2}:\d{2}$',
            'description': 'original programming',
        },
        'params': {
            # m3u8 download
            'skip_download': True,
        },
    }]

    def _real_extract(self, url):
        """Extract a video, a stream or a playlist from *url*.

        The page is downloaded and the JSON object assigned to
        ``AS_INITIAL_DATA`` (optionally suffixed with ``__``) is parsed; all
        page-level metadata below is read from that object.

        Returns a playlist result when the URL names only a show, or when it
        names a stream whose entry has no ``stream`` id (the playlist then
        lists the stream's ``archiveEpisodes``).  Otherwise returns the dict
        produced by ``_extract_cvp_info`` with ``id``, ``display_id`` and
        ``description`` filled in, plus episode/series fields for
        non-stream videos.

        Raises ``KeyError`` if the parsed data lacks ``streams``, ``show``,
        ``sluggedVideo`` or the video's ``id``, and ``StopIteration`` if the
        requested stream path is not present under ``streams``.
        """
        show_path, episode_path = re.match(self._VALID_URL, url).groups()
        display_id = episode_path or show_path
        webpage = self._download_webpage(url, display_id)
        initial_data = self._parse_json(self._search_regex(
            r'AS_INITIAL_DATA(?:__)?\s*=\s*({.+?});',
            webpage, 'initial data'), display_id)

        is_stream = show_path == 'streams'
        if is_stream:
            # A bare /videos/streams URL falls back to the 'live-stream' entry.
            if not episode_path:
                episode_path = 'live-stream'

            video_data = next(stream for stream_path, stream in initial_data['streams'].items() if stream_path == episode_path)
            video_id = video_data.get('stream')

            if not video_id:
                # No stream id: expose the archived episodes as a playlist.
                entries = []
                # ``or []`` (rather than a .get() default) also covers a key
                # that is present but holds JSON null.
                for episode in video_data.get('archiveEpisodes') or []:
                    episode_url = episode.get('url')
                    if not episode_url:
                        continue
                    entries.append(self.url_result(
                        episode_url, 'AdultSwim', episode.get('id')))
                return self.playlist_result(
                    entries, video_data.get('id'), video_data.get('title'),
                    strip_or_none(video_data.get('description')))
        else:
            show_data = initial_data['show']

            if not episode_path:
                # Show page: one playlist entry per video that has a slug.
                entries = []
                for video in show_data.get('videos') or []:
                    slug = video.get('slug')
                    if not slug:
                        continue
                    entries.append(self.url_result(
                        'http://adultswim.com/videos/%s/%s' % (show_path, slug),
                        'AdultSwim', video.get('id')))
                # Guard against 'metadata' being present but null.
                show_metadata = show_data.get('metadata') or {}
                return self.playlist_result(
                    entries, show_data.get('id'), show_data.get('title'),
                    strip_or_none(show_metadata.get('description')))

            video_data = show_data['sluggedVideo']
            video_id = video_data['id']

        info = self._extract_cvp_info(
            'http://www.adultswim.com/videos/api/v0/assets?platform=desktop&id=' + video_id,
            video_id, {
                'secure': {
                    'media_src': 'http://androidhls-secure.cdn.turner.com/adultswim/big',
                    'tokenizer_src': 'http://www.adultswim.com/astv/mvpd/processors/services/token_ipadAdobe.do',
                },
            }, {
                'url': url,
                'site_name': 'AdultSwim',
                'auth_required': video_data.get('auth'),
            })

        # Values already present in the CVP info win; page data is a fallback.
        info.update({
            'id': video_id,
            'display_id': display_id,
            'description': info.get('description') or strip_or_none(video_data.get('description')),
        })
        if not is_stream:
            info.update({
                'duration': info.get('duration') or int_or_none(video_data.get('duration')),
                'timestamp': info.get('timestamp') or int_or_none(video_data.get('launch_date')),
                'season_number': info.get('season_number') or int_or_none(video_data.get('season_number')),
                # Keep the bare episode title before the series name is prepended.
                'episode': info['title'],
                'episode_number': info.get('episode_number') or int_or_none(video_data.get('episode_number')),
            })

            info['series'] = video_data.get('collection_title') or info.get('series')
            if info['series'] and info['series'] != info['title']:
                info['title'] = '%s - %s' % (info['series'], info['title'])

        return info
[adultswim] Add new extractor 2014-05-19 11:25:58 +00:00			`# coding: utf-8`
			`from __future__ import unicode_literals`

			`import re`

[turner,nba,cnn,adultswim] add base extractor to parse cvp feeds 2016-08-28 15:43:15 +00:00			`from .turner import TurnerBaseIE`
[adultswim] Extract video info from onlineOriginals (Closes #10492) 2016-08-29 15:40:35 +00:00			`from ..utils import (`
			`int_or_none,`
[adultswim] Fix Extraction(closes #8640)(closes #10950)(closes closes #11042)(closes #12121) - add support for adobe pass authentication - add support for live streams - add support for show pages 2017-05-08 14:01:10 +00:00			`strip_or_none,`
[adultswim] Extract video info from onlineOriginals (Closes #10492) 2016-08-29 15:40:35 +00:00			`)`
[adultswim] Add new extractor 2014-05-19 11:25:58 +00:00
PEP8 applied 2014-11-23 19:41:03 +00:00
[turner,nba,cnn,adultswim] add base extractor to parse cvp feeds 2016-08-28 15:43:15 +00:00			`class AdultSwimIE(TurnerBaseIE):`
[adultswim] Fix Extraction(closes #8640)(closes #10950)(closes closes #11042)(closes #12121) - add support for adobe pass authentication - add support for live streams - add support for show pages 2017-05-08 14:01:10 +00:00			`_VALID_URL = r'https?://(?:www\.)?adultswim\.com/videos/(?P<show_path>[^/?#]+)(?:/(?P<episode_path>[^/?#]+))?'`
[adultswim] Updated to work with new site format (fixes #4317) 2014-12-06 05:49:41 +00:00
			`_TESTS = [{`
			`'url': 'http://adultswim.com/videos/rick-and-morty/pilot',`
			`'info_dict': {`
Extend various playlist tests 2015-02-17 23:49:10 +00:00			`'id': 'rQxZvXQ4ROaSOqq-or2Mow',`
[adultswim] Fix Extraction(closes #8640)(closes #10950)(closes closes #11042)(closes #12121) - add support for adobe pass authentication - add support for live streams - add support for show pages 2017-05-08 14:01:10 +00:00			`'ext': 'mp4',`
[adultswim] Updated to work with new site format (fixes #4317) 2014-12-06 05:49:41 +00:00			`'title': 'Rick and Morty - Pilot',`
[adultswim] Fix Extraction(closes #8640)(closes #10950)(closes closes #11042)(closes #12121) - add support for adobe pass authentication - add support for live streams - add support for show pages 2017-05-08 14:01:10 +00:00			`'description': 'Rick moves in with his daughter\'s family and establishes himself as a bad influence on his grandson, Morty.',`
			`'timestamp': 1493267400,`
			`'upload_date': '20170427',`
[adultswim] detect when video needs authentication 2015-10-10 11:28:12 +00:00			`},`
[adultswim] Fix Extraction(closes #8640)(closes #10950)(closes closes #11042)(closes #12121) - add support for adobe pass authentication - add support for live streams - add support for show pages 2017-05-08 14:01:10 +00:00			`'params': {`
			`# m3u8 download`
			`'skip_download': True,`
[adultswim] Updated to work with new site format (fixes #4317) 2014-12-06 05:49:41 +00:00			`},`
[adultswim] Fix Extraction(closes #8640)(closes #10950)(closes closes #11042)(closes #12121) - add support for adobe pass authentication - add support for live streams - add support for show pages 2017-05-08 14:01:10 +00:00			`'expected_warnings': ['Unable to download f4m manifest'],`
[adultswim] Improve video_info extraction (Fixes #5152) Look for video_info inside `slugged_video`, if slug is not found among collections. Also, simplify a bit. 2015-03-08 19:32:42 +00:00			`}, {`
			`'url': 'http://www.adultswim.com/videos/tim-and-eric-awesome-show-great-job/dr-steve-brule-for-your-wine/',`
			`'info_dict': {`
			`'id': 'sY3cMUR_TbuE4YmdjzbIcQ',`
[adultswim] Fix Extraction(closes #8640)(closes #10950)(closes closes #11042)(closes #12121) - add support for adobe pass authentication - add support for live streams - add support for show pages 2017-05-08 14:01:10 +00:00			`'ext': 'mp4',`
[adultswim] Improve video_info extraction (Fixes #5152) Look for video_info inside `slugged_video`, if slug is not found among collections. Also, simplify a bit. 2015-03-08 19:32:42 +00:00			`'title': 'Tim and Eric Awesome Show Great Job! - Dr. Steve Brule, For Your Wine',`
[adultswim] Fix Extraction(closes #8640)(closes #10950)(closes closes #11042)(closes #12121) - add support for adobe pass authentication - add support for live streams - add support for show pages 2017-05-08 14:01:10 +00:00			`'description': 'Dr. Brule reports live from Wine Country with a special report on wines. \nWatch Tim and Eric Awesome Show Great Job! episode #20, "Embarrassed" on Adult Swim.',`
			`'upload_date': '20080124',`
			`'timestamp': 1201150800,`
[adultswim] Improve video_info extraction (Fixes #5152) Look for video_info inside `slugged_video`, if slug is not found among collections. Also, simplify a bit. 2015-03-08 19:32:42 +00:00			`},`
[adultswim] update test 2015-12-21 16:07:19 +00:00			`'params': {`
			`# m3u8 download`
			`'skip_download': True,`
[adultswim] Fix Extraction(closes #8640)(closes #10950)(closes closes #11042)(closes #12121) - add support for adobe pass authentication - add support for live streams - add support for show pages 2017-05-08 14:01:10 +00:00			`},`
[adultswim] Add support for trailers (Closes #10235) 2016-08-05 17:00:05 +00:00			`}, {`
			`'url': 'http://www.adultswim.com/videos/decker/inside-decker-a-new-hero/',`
			`'info_dict': {`
			`'id': 'I0LQFQkaSUaFp8PnAWHhoQ',`
			`'ext': 'mp4',`
			`'title': 'Decker - Inside Decker: A New Hero',`
[adultswim] Fix Extraction(closes #8640)(closes #10950)(closes closes #11042)(closes #12121) - add support for adobe pass authentication - add support for live streams - add support for show pages 2017-05-08 14:01:10 +00:00			`'description': 'The guys recap the conclusion of the season. They announce a new hero, take a peek into the Victorville Film Archive and welcome back the talented James Dean.',`
			`'timestamp': 1469480460,`
			`'upload_date': '20160725',`
[adultswim] Add support for trailers (Closes #10235) 2016-08-05 17:00:05 +00:00			`},`
			`'params': {`
			`# m3u8 download`
			`'skip_download': True,`
[turner,nba,cnn,adultswim] add base extractor to parse cvp feeds 2016-08-28 15:43:15 +00:00			`},`
			`'expected_warnings': ['Unable to download f4m manifest'],`
[adultswim] Fix extraction (closes #10979) 2016-10-26 18:16:48 +00:00			`}, {`
[adultswim] Fix Extraction(closes #8640)(closes #10950)(closes closes #11042)(closes #12121) - add support for adobe pass authentication - add support for live streams - add support for show pages 2017-05-08 14:01:10 +00:00			`'url': 'http://www.adultswim.com/videos/attack-on-titan',`
			`'info_dict': {`
			`'id': 'b7A69dzfRzuaXIECdxW8XQ',`
			`'title': 'Attack on Titan',`
			`'description': 'md5:6c8e003ea0777b47013e894767f5e114',`
			`},`
			`'playlist_mincount': 12,`
			`}, {`
			`'url': 'http://www.adultswim.com/videos/streams/williams-stream',`
[adultswim] Fix extraction (closes #10979) 2016-10-26 18:16:48 +00:00			`'info_dict': {`
[adultswim] Fix Extraction(closes #8640)(closes #10950)(closes closes #11042)(closes #12121) - add support for adobe pass authentication - add support for live streams - add support for show pages 2017-05-08 14:01:10 +00:00			`'id': 'd8DEBj7QRfetLsRgFnGEyg',`
			`'ext': 'mp4',`
			`'title': r're:^Williams Stream \d{4}-\d{2}-\d{2} \d{2}:\d{2}$',`
			`'description': 'original programming',`
[adultswim] Fix extraction (closes #10979) 2016-10-26 18:16:48 +00:00			`},`
			`'params': {`
			`# m3u8 download`
			`'skip_download': True,`
			`},`
[adultswim] Updated to work with new site format (fixes #4317) 2014-12-06 05:49:41 +00:00			`}]`

[adultswim] Add new extractor 2014-05-19 11:25:58 +00:00			`def _real_extract(self, url):`
[adultswim] Fix Extraction(closes #8640)(closes #10950)(closes closes #11042)(closes #12121) - add support for adobe pass authentication - add support for live streams - add support for show pages 2017-05-08 14:01:10 +00:00			`show_path, episode_path = re.match(self._VALID_URL, url).groups()`
			`display_id = episode_path or show_path`
			`webpage = self._download_webpage(url, display_id)`
			`initial_data = self._parse_json(self._search_regex(`
			`r'AS_INITIAL_DATA(?:__)?\s*=\s*({.+?});',`
			`webpage, 'initial data'), display_id)`

			`is_stream = show_path == 'streams'`
			`if is_stream:`
			`if not episode_path:`
			`episode_path = 'live-stream'`

			`video_data = next(stream for stream_path, stream in initial_data['streams'].items() if stream_path == episode_path)`
			`video_id = video_data.get('stream')`

			`if not video_id:`
			`entries = []`
			`for episode in video_data.get('archiveEpisodes', []):`
			`episode_url = episode.get('url')`
			`if not episode_url:`
			`continue`
			`entries.append(self.url_result(`
			`episode_url, 'AdultSwim', episode.get('id')))`
			`return self.playlist_result(`
			`entries, video_data.get('id'), video_data.get('title'),`
			`strip_or_none(video_data.get('description')))`
[adultswim] Updated to work with new site format (fixes #4317) 2014-12-06 05:49:41 +00:00			`else:`
[adultswim] Fix Extraction(closes #8640)(closes #10950)(closes closes #11042)(closes #12121) - add support for adobe pass authentication - add support for live streams - add support for show pages 2017-05-08 14:01:10 +00:00			`show_data = initial_data['show']`

			`if not episode_path:`
			`entries = []`
			`for video in show_data.get('videos', []):`
			`slug = video.get('slug')`
			`if not slug:`
			`continue`
			`entries.append(self.url_result(`
			`'http://adultswim.com/videos/%s/%s' % (show_path, slug),`
			`'AdultSwim', video.get('id')))`
			`return self.playlist_result(`
			`entries, show_data.get('id'), show_data.get('title'),`
			`strip_or_none(show_data.get('metadata', {}).get('description')))`

			`video_data = show_data['sluggedVideo']`
			`video_id = video_data['id']`

			`info = self._extract_cvp_info(`
use platform=desktop in assets url(closes #13041) 2017-05-10 07:50:30 +00:00			`'http://www.adultswim.com/videos/api/v0/assets?platform=desktop&id=' + video_id,`
[adultswim] Fix Extraction(closes #8640)(closes #10950)(closes closes #11042)(closes #12121) - add support for adobe pass authentication - add support for live streams - add support for show pages 2017-05-08 14:01:10 +00:00			`video_id, {`
			`'secure': {`
			`'media_src': 'http://androidhls-secure.cdn.turner.com/adultswim/big',`
			`'tokenizer_src': 'http://www.adultswim.com/astv/mvpd/processors/services/token_ipadAdobe.do',`
			`},`
			`}, {`
			`'url': url,`
			`'site_name': 'AdultSwim',`
			`'auth_required': video_data.get('auth'),`
			`})`
[adultswim] Add new extractor 2014-05-19 11:25:58 +00:00
[adultswim] Fix Extraction(closes #8640)(closes #10950)(closes closes #11042)(closes #12121) - add support for adobe pass authentication - add support for live streams - add support for show pages 2017-05-08 14:01:10 +00:00			`info.update({`
			`'id': video_id,`
			`'display_id': display_id,`
			`'description': info.get('description') or strip_or_none(video_data.get('description')),`
			`})`
			`if not is_stream:`
			`info.update({`
			`'duration': info.get('duration') or int_or_none(video_data.get('duration')),`
			`'timestamp': info.get('timestamp') or int_or_none(video_data.get('launch_date')),`
			`'season_number': info.get('season_number') or int_or_none(video_data.get('season_number')),`
			`'episode': info['title'],`
			`'episode_number': info.get('episode_number') or int_or_none(video_data.get('episode_number')),`
[adultswim] Add new extractor 2014-05-19 11:25:58 +00:00			`})`

[adultswim] Fix Extraction(closes #8640)(closes #10950)(closes closes #11042)(closes #12121) - add support for adobe pass authentication - add support for live streams - add support for show pages 2017-05-08 14:01:10 +00:00			`info['series'] = video_data.get('collection_title') or info.get('series')`
			`if info['series'] and info['series'] != info['title']:`
			`info['title'] = '%s - %s' % (info['series'], info['title'])`

			`return info`