1
0
mirror of https://github.com/ytdl-org/youtube-dl.git synced 2025-01-10 19:48:57 +00:00

[ceskatelevize] Fix video availability check and add geo unrestricted test

This commit is contained in:
Sergey M․ 2014-03-01 22:54:37 +07:00
parent f00fc78674
commit 7d78f0cc48

View File

@ -16,7 +16,8 @@ from ..utils import (
class CeskaTelevizeIE(InfoExtractor):
_VALID_URL = r'https?://www\.ceskatelevize\.cz/(porady|ivysilani)/(.+/)?(?P<id>[^?#]+)'
_TESTS = [{
_TESTS = [
{
'url': 'http://www.ceskatelevize.cz/ivysilani/10532695142-prvni-republika/213512120230004-spanelska-chripka',
'info_dict': {
'id': '213512120230004',
@ -28,7 +29,8 @@ class CeskaTelevizeIE(InfoExtractor):
'skip_download': True, # requires rtmpdump
},
'skip': 'Works only from Czech Republic.',
}, {
},
{
'url': 'http://www.ceskatelevize.cz/ivysilani/1030584952-tsatsiki-maminka-a-policajt',
'info_dict': {
'id': '20138143440',
@ -40,7 +42,20 @@ class CeskaTelevizeIE(InfoExtractor):
'skip_download': True, # requires rtmpdump
},
'skip': 'Works only from Czech Republic.',
}]
},
{
'url': 'http://www.ceskatelevize.cz/ivysilani/10532695142-prvni-republika/bonus/14716-zpevacka-z-duparny-bobina',
'info_dict': {
'id': '14716',
'ext': 'flv',
'title': 'První republika: Zpěvačka z Dupárny Bobina',
'duration': 90,
},
'params': {
'skip_download': True, # requires rtmpdump
},
},
]
def _real_extract(self, url):
url = url.replace('/porady/', '/ivysilani/').replace('/video/', '')
@ -50,9 +65,9 @@ class CeskaTelevizeIE(InfoExtractor):
webpage = self._download_webpage(url, video_id)
if '<p class="title">Chyba konfigurace prohlížeče.</p>' not in webpage:
msg = self._html_search_regex(r'<p class="title">(.+?)</p>', webpage, 'error-message')
raise ExtractorError(msg.replace('<br />', ' '))
NOT_AVAILABLE_STRING = 'This content is not available at your territory due to limited copyright.'
if '%s</p>' % NOT_AVAILABLE_STRING in webpage:
raise ExtractorError(NOT_AVAILABLE_STRING, expected=True)
typ = self._html_search_regex(r'getPlaylistUrl\(\[\{"type":"(.+?)","id":".+?"\}\],', webpage, 'type')
episode_id = self._html_search_regex(r'getPlaylistUrl\(\[\{"type":".+?","id":"(.+?)"\}\],', webpage, 'episode_id')