# coding: utf-8 from __future__ import unicode_literals import json from .common import InfoExtractor class MegaCartoonsIE(InfoExtractor): _VALID_URL = r'https?://(?:www\.)?megacartoons\.net/(?P[a-z-]+)/' _TEST = { 'url': 'https://www.megacartoons.net/help-wanted/', 'md5': '4ba9be574f9a17abe0c074e2f955fded', 'info_dict': { 'id': 'help-wanted', 'title': 'help-wanted', 'ext': 'mp4', 'thumbnail': r're:^https?://.*\.jpg$', 'description': 'Help Wanted: Encouraged by his best friend, Patrick Starfish, SpongeBob overcomes his fears and finally applies for that dream job as a fry cook at the Krusty Krab. Challenged by the owner, Mr. Krabs, and his assistant Squidward, to prove himself worthy of the job, SpongeBob rises to the occasion, with the help of one very special spatula, by feeding a sea of ravenous anchovies.' } } def _real_extract(self, url): video_id = self._match_id(url) webpage = self._download_webpage(url, video_id) # The id is equal to the title title = video_id # Video and thumbnail are url_json = json.loads(self._html_search_regex(r'{.*})".*>', webpage, 'videourls')) video_url = url_json['sources'][0]['src'] video_type = url_json['sources'][0]['type'] video_thumbnail = url_json['splash'] video_description = self._html_search_regex(r'

(?P.*)

', webpage, 'videodescription') return { 'id': video_id, 'title': title, 'format': video_type, 'url': video_url, 'thumbnail': video_thumbnail, 'description': video_description, }