mirror of
https://github.com/ytdl-org/youtube-dl.git
synced 2024-11-16 20:47:37 +00:00
Extract further fields; implement some review comments
This commit is contained in:
parent
35081ecf00
commit
3918da628d
1 changed file with 66 additions and 17 deletions
|
@@ -2,39 +2,88 @@
|
||||||
from __future__ import unicode_literals
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
from .common import InfoExtractor
|
from .common import InfoExtractor
|
||||||
|
from ..utils import (
|
||||||
|
clean_html,
|
||||||
|
float_or_none,
|
||||||
|
parse_iso8601,
|
||||||
|
str_or_none,
|
||||||
|
str_to_int,
|
||||||
|
try_get,
|
||||||
|
url_or_none,
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
class TeleportalIE(InfoExtractor):
|
class TeleportalIE(InfoExtractor):
|
||||||
_VALID_URL = r'https?://(?:www\.)?teleportal\.ua(/ua)?/(?P<id>[0-9a-z-/]+)'
|
_VALID_URL = r'https?://(?:www\.)?teleportal\.ua/(?:ua/)?(?P<id>[0-9a-z-]+(?:/[0-9a-z-]+)*)'
|
||||||
_TEST = {
|
_TEST = {
|
||||||
'url': 'https://teleportal.ua/ua/show/stb/master-cheff/bitva-sezonov/vypusk-3',
|
'url': 'https://teleportal.ua/ua/show/stb/master-cheff/bitva-sezonov/vypusk-3',
|
||||||
'md5': '07bd056c45b515fa9cc0202b8403df41',
|
# no permanent check on file contents as HLS may vary
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': 'show/stb/master-cheff/bitva-sezonov/vypusk-3',
|
'id': 'show/stb/master-cheff/bitva-sezonov/vypusk-3',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'МастерШеф. Битва сезонів 3 випуск: найогидніший випуск сезону!',
|
'title': 'МастерШеф. Битва сезонів 3 випуск: найогидніший випуск сезону!',
|
||||||
'thumbnail': r're:^https?://.*\.jpg$',
|
'display_id': '2618466',
|
||||||
'description': r're:^<p>Не пропустіть.*',
|
'description': 'md5:4179bcc3a12edfa2f655888cd741ac09',
|
||||||
}
|
'timestamp': 1644102480,
|
||||||
|
'upload_date': '20220205',
|
||||||
|
'thumbnail': r're:^https?://.+\.jpg$',
|
||||||
|
'release_timestamp': 1643994000,
|
||||||
|
'duration': 11254.0,
|
||||||
|
'series_id': '20632',
|
||||||
|
'series': 'МастерШеф. Битва сезонів 3 випуск: найогидніший випуск сезону!',
|
||||||
|
'season': 'Битва сезонів',
|
||||||
|
'episode': 'Найогидніший випуск сезону!',
|
||||||
|
'episode_num': 3,
|
||||||
|
'categories': ['Шоу'],
|
||||||
|
},
|
||||||
|
'params': {
|
||||||
|
'hls_prefer_native': True,
|
||||||
|
# 'skip_download': True,
|
||||||
|
},
|
||||||
}
|
}
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
video_id = self._match_id(url)
|
video_id = self._match_id(url)
|
||||||
backend_url = 'https://tp-back.starlight.digital/ua/{}'.format(video_id)
|
backend_url = 'https://tp-back.starlight.digital/ua/' + video_id
|
||||||
metadata = self._download_json(backend_url, video_id)
|
series_metadata = self._download_json(backend_url, video_id) or {}
|
||||||
api_metadata = self._download_json('https://vcms-api2.starlight.digital/player-api/{}?referer=https://teleportal.ua/&lang=ua'.format(metadata['hash']), video_id)
|
title = series_metadata['title']
|
||||||
|
_hash = series_metadata.get('hash', '')
|
||||||
|
api_url = 'https://vcms-api2.starlight.digital/player-api/' + _hash
|
||||||
|
api_metadata = self._download_json(
|
||||||
|
api_url, video_id,
|
||||||
|
query={
|
||||||
|
'referer': 'https://teleportal.ua/',
|
||||||
|
'lang': 'ua',
|
||||||
|
}
|
||||||
|
)
|
||||||
|
video_info = api_metadata['video'][0]
|
||||||
|
formats = []
|
||||||
|
for media in ('mediaHlsNoAdv', 'mediaHls'):
|
||||||
|
media = url_or_none(try_get(video_info, lambda x: x[media]))
|
||||||
|
if not media:
|
||||||
|
continue
|
||||||
|
formats.extend(self._extract_m3u8_formats(media, video_id, 'mp4', fatal=False))
|
||||||
|
break
|
||||||
|
self._sort_formats(formats)
|
||||||
|
|
||||||
try:
|
thumbnail = url_or_none(video_info.get('poster'))
|
||||||
thumbnail = api_metadata['video'][0]['poster']
|
category = series_metadata.get('typeTitle')
|
||||||
except (KeyError, IndexError):
|
|
||||||
thumbnail = None
|
|
||||||
|
|
||||||
return {
|
return {
|
||||||
'id': video_id,
|
'id': video_id,
|
||||||
'title': metadata.get('title'),
|
'title': title,
|
||||||
'description': metadata.get('description'),
|
'formats': formats,
|
||||||
'real_id': metadata.get('id'),
|
'description': clean_html(series_metadata.get('description')) or series_metadata.get('seoDescription'),
|
||||||
'hash': metadata.get('hash'),
|
'display_id': str_or_none(video_info.get('vcmsId')),
|
||||||
|
'hash': _hash,
|
||||||
'thumbnail': thumbnail,
|
'thumbnail': thumbnail,
|
||||||
'formats': self._extract_m3u8_formats(api_metadata['video'][0]['mediaHls'], video_id, 'mp4'),
|
'timestamp': parse_iso8601(video_info.get('time_upload_video'), delimiter=' '),
|
||||||
|
'release_timestamp': parse_iso8601(video_info.get('publishDate'), delimiter=' '),
|
||||||
|
'duration': float_or_none(video_info.get('duration')),
|
||||||
|
'series_id': str_or_none(series_metadata.get('id')),
|
||||||
|
'series': series_metadata.get('title'),
|
||||||
|
'season': video_info.get('seasonName') or series_metadata.get('seasonGallery', {}).get('title'),
|
||||||
|
'episode': video_info.get('name'),
|
||||||
|
'episode_num': str_to_int(series_metadata.get('seriesTitle')),
|
||||||
|
'categories': [category] if category else None,
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in a new issue