2022-05-16 19:28:19 +00:00
# coding: utf-8
from __future__ import unicode_literals
import json
from . common import InfoExtractor
class MegaCartoonsIE ( InfoExtractor ) :
_VALID_URL = r ' https?://(?:www \ .)?megacartoons \ .net/(?P<id>[a-z-]+)/ '
_TEST = {
' url ' : ' https://www.megacartoons.net/help-wanted/ ' ,
' md5 ' : ' 4ba9be574f9a17abe0c074e2f955fded ' ,
' info_dict ' : {
' id ' : ' help-wanted ' ,
' title ' : ' help-wanted ' ,
' ext ' : ' mp4 ' ,
' thumbnail ' : r ' re:^https?://.* \ .jpg$ ' ,
' description ' : ' Help Wanted: Encouraged by his best friend, Patrick Starfish, SpongeBob overcomes his fears and finally applies for that dream job as a fry cook at the Krusty Krab. Challenged by the owner, Mr. Krabs, and his assistant Squidward, to prove himself worthy of the job, SpongeBob rises to the occasion, with the help of one very special spatula, by feeding a sea of ravenous anchovies. '
}
}
def _real_extract ( self , url ) :
2022-05-16 19:37:35 +00:00
# ID is equal to the episode name
2022-05-16 19:28:19 +00:00
video_id = self . _match_id ( url )
webpage = self . _download_webpage ( url , video_id )
# The id is equal to the title
title = video_id
2022-05-16 19:37:35 +00:00
# Video data is stored in a json -> extract it from the raw html
2022-05-16 19:28:19 +00:00
url_json = json . loads ( self . _html_search_regex ( r ' <div.*data-item= " (?P<videourls> { .*}) " .*> ' , webpage , ' videourls ' ) )
2022-05-16 19:37:35 +00:00
video_url = url_json [ ' sources ' ] [ 0 ] [ ' src ' ] # Get the video url
video_type = url_json [ ' sources ' ] [ 0 ] [ ' type ' ] # Get the video type -> 'video/mp4'
video_thumbnail = url_json [ ' splash ' ] # Get the thumbnail
2022-05-16 19:28:19 +00:00
2022-05-16 19:37:35 +00:00
# Every video has a short summary -> save it as description
2022-05-16 19:28:19 +00:00
video_description = self . _html_search_regex ( r ' <p>(?P<videodescription>.*)</p> ' , webpage , ' videodescription ' )
return {
' id ' : video_id ,
' title ' : title ,
' format ' : video_type ,
' url ' : video_url ,
' thumbnail ' : video_thumbnail ,
' description ' : video_description ,
}