mirror of
https://github.com/ytdl-org/youtube-dl.git
synced 2024-11-22 18:22:21 +00:00
62 lines
2.3 KiB
Python
62 lines
2.3 KiB
Python
# coding: utf-8
|
|
from __future__ import unicode_literals
|
|
|
|
from .turner import TurnerBaseIE
|
|
from ..utils import int_or_none
|
|
|
|
|
|
class CartoonNetworkIE(TurnerBaseIE):
    """Extractor for cartoonnetwork.com clip and episode pages.

    The video page embeds its metadata as JavaScript string assignments
    (``_cnglobal.currentVideo.<key> = "...";`` or
    ``video_metadata.content_<key> = "...";``).  Those assignments are
    scraped for the media id, title, series and numbering, and the media
    id is handed to ``_extract_ngtv_info`` (provided by the base class)
    to obtain the rest of the info dict.
    """

    # The ``id`` group is the last path component without the trailing
    # ``-clip.html`` / ``-episode.html`` suffix.
    _VALID_URL = r'https?://(?:www\.)?cartoonnetwork\.com/video/(?:[^/]+/)+(?P<id>[^/?#]+)-(?:clip|episode)\.html'
    _TEST = {
        'url': 'https://www.cartoonnetwork.com/video/ben-10/how-to-draw-upgrade-episode.html',
        'info_dict': {
            'id': '6e3375097f63874ebccec7ef677c1c3845fa850e',
            'ext': 'mp4',
            'title': 'How to Draw Upgrade',
            'description': 'md5:2061d83776db7e8be4879684eefe8c0f',
        },
        'params': {
            # m3u8 download
            'skip_download': True,
        },
    }

    def _real_extract(self, url):
        """Build the info dict for the video page at ``url``.

        The media id and the title are mandatory (their lookups are
        fatal); series, season number and episode number are optional
        and fall back to the page's ``<meta>`` tags when the JavaScript
        variables are absent.
        """
        display_id = self._match_id(url)
        webpage = self._download_webpage(url, display_id)

        def page_var(global_key, label, content_key=None, value_pattern='[^"]+', fatal=False):
            # Look up the quoted value assigned to
            # ``_cnglobal.currentVideo.<global_key>`` or, when
            # ``content_key`` is given, alternatively to
            # ``video_metadata.content_<content_key>``.
            # Both key arguments are regex fragments, not literal names.
            targets = r'_cnglobal\.currentVideo\.' + global_key
            if content_key:
                targets += r'|video_metadata\.content_' + content_key
            assignment_re = r'(?:%s)\s*=\s*"(%s)";' % (targets, value_pattern)
            return self._search_regex(assignment_re, webpage, label, fatal=fatal)

        media_id = page_var('mediaId', 'media id', 'id', '[0-9a-f]{40}', True)
        title = page_var('episodeTitle', 'title', '(?:episodeName|name)', fatal=True)

        # Anything other than an explicit "unauth" marker (including a
        # missing authType) is treated as requiring authentication.
        needs_auth = page_var('authType', 'auth type') != 'unauth'
        info = self._extract_ngtv_info(
            media_id,
            {'networkId': 'cartoonnetwork'},
            {
                'url': url,
                'site_name': 'CartoonNetwork',
                'auth_required': needs_auth,
            })

        series = page_var('propertyName', 'series', 'showName')
        if not series:
            series = self._html_search_meta('partOfSeries', webpage)
        description = self._html_search_meta('description', webpage)

        # Values scraped from the page take precedence over whatever the
        # base-class helper returned under the same keys.
        info.update({
            'id': media_id,
            'display_id': display_id,
            'title': title,
            'description': description,
            'series': series,
            'episode': title,
        })

        # seasonNumber / episodeNumber: JavaScript variable first, then
        # the <meta> tag of the same name.
        for kind in ('season', 'episode'):
            js_key = kind + 'Number'
            raw_number = page_var(js_key, kind + ' number', value_pattern=r'\d+')
            if not raw_number:
                raw_number = self._html_search_meta(js_key, webpage)
            info[kind + '_number'] = int_or_none(raw_number)

        return info
|