mirror of
https://github.com/yt-dlp/yt-dlp
synced 2025-01-16 03:40:50 +01:00
[ie/vidio] Fix login; use new API; check DRM; extract comments
This commit is contained in:
parent
3bb739f188
commit
20c66ec13e
1 changed files with 293 additions and 79 deletions
|
@ -1,6 +1,7 @@
|
||||||
import base64
|
import base64
|
||||||
import hashlib
|
import hashlib
|
||||||
import hmac
|
import hmac
|
||||||
|
import json
|
||||||
import time
|
import time
|
||||||
|
|
||||||
from .common import InfoExtractor
|
from .common import InfoExtractor
|
||||||
|
@ -8,13 +9,17 @@ from ..aes import aes_cbc_encrypt
|
||||||
from ..utils import (
|
from ..utils import (
|
||||||
ExtractorError,
|
ExtractorError,
|
||||||
clean_html,
|
clean_html,
|
||||||
|
extract_attributes,
|
||||||
format_field,
|
format_field,
|
||||||
get_element_by_class,
|
get_element_by_class,
|
||||||
|
get_element_html_by_id,
|
||||||
int_or_none,
|
int_or_none,
|
||||||
join_nonempty,
|
join_nonempty,
|
||||||
parse_iso8601,
|
parse_iso8601,
|
||||||
|
remove_end,
|
||||||
smuggle_url,
|
smuggle_url,
|
||||||
str_or_none,
|
str_or_none,
|
||||||
|
str_to_int,
|
||||||
strip_or_none,
|
strip_or_none,
|
||||||
try_get,
|
try_get,
|
||||||
unsmuggle_url,
|
unsmuggle_url,
|
||||||
|
@ -44,6 +49,7 @@ class VidioBaseIE(InfoExtractor):
|
||||||
login_form.update({
|
login_form.update({
|
||||||
'user[login]': username,
|
'user[login]': username,
|
||||||
'user[password]': password,
|
'user[password]': password,
|
||||||
|
'authenticity_token': self._html_search_meta('csrf-token', login_page, fatal=True),
|
||||||
})
|
})
|
||||||
login_post, login_post_urlh = self._download_webpage_handle(
|
login_post, login_post_urlh = self._download_webpage_handle(
|
||||||
self._LOGIN_URL, None, 'Logging in', data=urlencode_postdata(login_form), expected_status=[302, 401])
|
self._LOGIN_URL, None, 'Logging in', data=urlencode_postdata(login_form), expected_status=[302, 401])
|
||||||
|
@ -77,7 +83,9 @@ class VidioBaseIE(InfoExtractor):
|
||||||
|
|
||||||
|
|
||||||
class VidioIE(VidioBaseIE):
|
class VidioIE(VidioBaseIE):
|
||||||
|
_GEO_COUNTRIES = ['ID']
|
||||||
_VALID_URL = r'https?://(?:www\.)?vidio\.com/(watch|embed)/(?P<id>\d+)-(?P<display_id>[^/?#&]+)'
|
_VALID_URL = r'https?://(?:www\.)?vidio\.com/(watch|embed)/(?P<id>\d+)-(?P<display_id>[^/?#&]+)'
|
||||||
|
_EMBED_REGEX = [rf'(?x)<iframe[^>]+\bsrc=[\'"](?P<url>{_VALID_URL})']
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'http://www.vidio.com/watch/165683-dj_ambred-booyah-live-2015',
|
'url': 'http://www.vidio.com/watch/165683-dj_ambred-booyah-live-2015',
|
||||||
'md5': 'abac81b1a205a8d94c609a473b5ea62a',
|
'md5': 'abac81b1a205a8d94c609a473b5ea62a',
|
||||||
|
@ -87,113 +95,319 @@ class VidioIE(VidioBaseIE):
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'DJ_AMBRED - Booyah (Live 2015)',
|
'title': 'DJ_AMBRED - Booyah (Live 2015)',
|
||||||
'description': 'md5:27dc15f819b6a78a626490881adbadf8',
|
'description': 'md5:27dc15f819b6a78a626490881adbadf8',
|
||||||
'thumbnail': r're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://thumbor\.prod\.vidiocdn\.com/.+\.jpg$',
|
||||||
'duration': 149,
|
'duration': 149,
|
||||||
'like_count': int,
|
'uploader': 'twelvepictures',
|
||||||
'uploader': 'TWELVE Pic',
|
'timestamp': 1444902960,
|
||||||
'timestamp': 1444902800,
|
|
||||||
'upload_date': '20151015',
|
'upload_date': '20151015',
|
||||||
'uploader_id': 'twelvepictures',
|
'uploader_id': '270115',
|
||||||
'channel': 'Cover Music Video',
|
'channel': 'cover-music-video',
|
||||||
'channel_id': '280236',
|
'channel_id': '280236',
|
||||||
'view_count': int,
|
'channel_url': 'https://www.vidio.com/@twelvepictures/channels/280236-cover-music-video',
|
||||||
'dislike_count': int,
|
|
||||||
'comment_count': int,
|
|
||||||
'tags': 'count:3',
|
'tags': 'count:3',
|
||||||
'uploader_url': 'https://www.vidio.com/@twelvepictures',
|
'uploader_url': 'https://www.vidio.com/@twelvepictures',
|
||||||
|
'live_status': 'not_live',
|
||||||
|
'genres': ['vlog', 'comedy', 'edm'],
|
||||||
|
'season_id': '',
|
||||||
|
'season_name': '',
|
||||||
|
'age_limit': 13,
|
||||||
|
'comment_count': int,
|
||||||
|
},
|
||||||
|
'params': {
|
||||||
|
'getcomments': True,
|
||||||
},
|
},
|
||||||
}, {
|
}, {
|
||||||
|
# DRM protected
|
||||||
|
'url': 'https://www.vidio.com/watch/7095853-ep-04-sketch-book',
|
||||||
|
'md5': 'abac81b1a205a8d94c609a473b5ea62a',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '7095853',
|
||||||
|
'display_id': 'ep-04-sketch-book',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'Ep 04 - Sketch Book',
|
||||||
|
'description': 'md5:9e22b4b1dbd65209c143d7009e899830',
|
||||||
|
'thumbnail': r're:^https?://thumbor\.prod\.vidiocdn\.com/.+\.jpg$',
|
||||||
|
'duration': 2784,
|
||||||
|
'uploader': 'vidiooriginal',
|
||||||
|
'timestamp': 1658509200,
|
||||||
|
'upload_date': '20220722',
|
||||||
|
'uploader_id': '31052580',
|
||||||
|
'channel': 'cupcake-untuk-rain',
|
||||||
|
'channel_id': '52332655',
|
||||||
|
'channel_url': 'https://www.vidio.com/@vidiooriginal/channels/52332655-cupcake-untuk-rain',
|
||||||
|
'tags': [],
|
||||||
|
'uploader_url': 'https://www.vidio.com/@vidiooriginal',
|
||||||
|
'live_status': 'not_live',
|
||||||
|
'genres': ['romance', 'drama', 'comedy', 'Teen', 'love triangle'],
|
||||||
|
'season_id': '8220',
|
||||||
|
'season_name': 'Season 1',
|
||||||
|
'age_limit': 13,
|
||||||
|
'availability': 'premium_only',
|
||||||
|
'comment_count': int,
|
||||||
|
},
|
||||||
|
'expected_warnings': ['This video is DRM protected'],
|
||||||
|
'params': {
|
||||||
|
'getcomments': True,
|
||||||
|
'skip_download': True,
|
||||||
|
'ignore_no_formats_error': True,
|
||||||
|
},
|
||||||
|
}, {
|
||||||
|
'url': 'https://www.vidio.com/watch/7439193-episode-1-magic-5',
|
||||||
|
'md5': 'b1644c574aeb20c91503be367ac2d211',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '7439193',
|
||||||
|
'display_id': 'episode-1-magic-5',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'Episode 1 - Magic 5',
|
||||||
|
'description': 'md5:367255f9e8e7ad7192c26218f01b6260',
|
||||||
|
'thumbnail': r're:^https?://thumbor\.prod\.vidiocdn\.com/.+\.jpg$',
|
||||||
|
'duration': 6126,
|
||||||
|
'uploader': 'indosiar',
|
||||||
|
'timestamp': 1679315400,
|
||||||
|
'upload_date': '20230320',
|
||||||
|
'uploader_id': '12',
|
||||||
|
'channel': 'magic-5',
|
||||||
|
'channel_id': '52350795',
|
||||||
|
'channel_url': 'https://www.vidio.com/@indosiar/channels/52350795-magic-5',
|
||||||
|
'tags': ['basmalah', 'raden-rakha', 'eby-da-5', 'sinetron', 'afan-da-5', 'sridevi-da5'],
|
||||||
|
'uploader_url': 'https://www.vidio.com/@indosiar',
|
||||||
|
'live_status': 'not_live',
|
||||||
|
'genres': ['drama', 'fantasy', 'friendship'],
|
||||||
|
'season_id': '11017',
|
||||||
|
'season_name': 'Episode',
|
||||||
|
'age_limit': 13,
|
||||||
|
},
|
||||||
|
}, {
|
||||||
|
'url': 'https://www.vidio.com/watch/1716926-mas-suka-masukin-aja',
|
||||||
|
'md5': 'acc4009eeac0033328419aada7bc6925',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '1716926',
|
||||||
|
'display_id': 'mas-suka-masukin-aja',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'Mas Suka, Masukin Aja',
|
||||||
|
'description': 'md5:667093b08e07b6fb92f68037f81f2267',
|
||||||
|
'thumbnail': r're:^https?://thumbor\.prod\.vidiocdn\.com/.+\.jpg$',
|
||||||
|
'duration': 5080,
|
||||||
|
'uploader': 'vidiopremier',
|
||||||
|
'timestamp': 1564735560,
|
||||||
|
'upload_date': '20190802',
|
||||||
|
'uploader_id': '26094842',
|
||||||
|
'channel': 'mas-suka-masukin-aja',
|
||||||
|
'channel_id': '34112289',
|
||||||
|
'channel_url': 'https://www.vidio.com/@vidiopremier/channels/34112289-mas-suka-masukin-aja',
|
||||||
|
'tags': [],
|
||||||
|
'uploader_url': 'https://www.vidio.com/@vidiopremier',
|
||||||
|
'live_status': 'not_live',
|
||||||
|
'genres': ['comedy', 'romance'],
|
||||||
|
'season_id': '663',
|
||||||
|
'season_name': '',
|
||||||
|
'age_limit': 18,
|
||||||
|
'availability': 'premium_only',
|
||||||
|
},
|
||||||
|
'params': {
|
||||||
|
'ignore_no_formats_error': True,
|
||||||
|
},
|
||||||
|
'expected_warnings': ['This show isn\'t available in your country'],
|
||||||
|
}, {
|
||||||
|
'url': 'https://www.vidio.com/watch/2372948-first-day-of-school-kindergarten-life-song-beabeo-nursery-rhymes-kids-songs',
|
||||||
|
'md5': 'c6d1bde08eee88bea27cca9dc38bc3df',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '2372948',
|
||||||
|
'display_id': 'first-day-of-school-kindergarten-life-song-beabeo-nursery-rhymes-kids-songs',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'First Day of School | Kindergarten Life Song | BeaBeo Nursery Rhymes & Kids Songs',
|
||||||
|
'description': 'md5:d505486a67415903f7f3ab61adfd5a91',
|
||||||
|
'thumbnail': r're:^https?://thumbor\.prod\.vidiocdn\.com/.+\.jpg$',
|
||||||
|
'duration': 517,
|
||||||
|
'uploader': 'kidsstartv',
|
||||||
|
'timestamp': 1638518400,
|
||||||
|
'upload_date': '20211203',
|
||||||
|
'uploader_id': '38247189',
|
||||||
|
'channel': 'beabeo-school-series',
|
||||||
|
'channel_id': '52311987',
|
||||||
|
'channel_url': 'https://www.vidio.com/@kidsstartv/channels/52311987-beabeo-school-series',
|
||||||
|
'tags': [],
|
||||||
|
'uploader_url': 'https://www.vidio.com/@kidsstartv',
|
||||||
|
'live_status': 'not_live',
|
||||||
|
'genres': ['animation', 'Cartoon'],
|
||||||
|
'season_id': '6023',
|
||||||
|
'season_name': 'school series',
|
||||||
|
},
|
||||||
|
}, {
|
||||||
|
'url': 'https://www.vidio.com/watch/1550718-stand-by-me-doraemon',
|
||||||
|
'md5': '405b61a2f06c74e052e0bd67cad6b891',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '1550718',
|
||||||
|
'display_id': 'stand-by-me-doraemon',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'Stand by Me Doraemon',
|
||||||
|
'description': 'md5:673d899f6a58dd4b0d18aebe30545e2a',
|
||||||
|
'thumbnail': r're:^https?://thumbor\.prod\.vidiocdn\.com/.+\.jpg$',
|
||||||
|
'duration': 5429,
|
||||||
|
'uploader': 'vidiopremier',
|
||||||
|
'timestamp': 1545815634,
|
||||||
|
'upload_date': '20181226',
|
||||||
|
'uploader_id': '26094842',
|
||||||
|
'channel': 'stand-by-me-doraemon',
|
||||||
|
'channel_id': '29750953',
|
||||||
|
'channel_url': 'https://www.vidio.com/@vidiopremier/channels/29750953-stand-by-me-doraemon',
|
||||||
|
'tags': ['anime-lucu', 'top-10-this-week', 'kids', 'stand-by-me-doraemon-2'],
|
||||||
|
'uploader_url': 'https://www.vidio.com/@vidiopremier',
|
||||||
|
'live_status': 'not_live',
|
||||||
|
'genres': ['anime', 'family', 'adventure', 'comedy', 'coming of age'],
|
||||||
|
'season_id': '237',
|
||||||
|
'season_name': '',
|
||||||
|
'age_limit': 7,
|
||||||
|
'availability': 'premium_only',
|
||||||
|
},
|
||||||
|
'params': {
|
||||||
|
'ignore_no_formats_error': True,
|
||||||
|
},
|
||||||
|
'expected_warnings': ['This show isn\'t available in your country'],
|
||||||
|
}, {
|
||||||
|
# 404 Not Found
|
||||||
'url': 'https://www.vidio.com/watch/77949-south-korea-test-fires-missile-that-can-strike-all-of-the-north',
|
'url': 'https://www.vidio.com/watch/77949-south-korea-test-fires-missile-that-can-strike-all-of-the-north',
|
||||||
'only_matching': True,
|
'only_matching': True,
|
||||||
}, {
|
}]
|
||||||
# Premier-exclusive video
|
_WEBPAGE_TESTS = [{
|
||||||
'url': 'https://www.vidio.com/watch/1550718-stand-by-me-doraemon',
|
# embed player: https://www.vidio.com/embed/7115874-fakta-temuan-suspek-cacar-monyet-di-jawa-tengah
|
||||||
'only_matching': True,
|
'url': 'https://enamplus.liputan6.com/read/5033648/video-fakta-temuan-suspek-cacar-monyet-di-jawa-tengah',
|
||||||
}, {
|
|
||||||
# embed url from https://enamplus.liputan6.com/read/5033648/video-fakta-temuan-suspek-cacar-monyet-di-jawa-tengah
|
|
||||||
'url': 'https://www.vidio.com/embed/7115874-fakta-temuan-suspek-cacar-monyet-di-jawa-tengah',
|
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '7115874',
|
'id': '7115874',
|
||||||
'ext': 'mp4',
|
|
||||||
'channel_id': '40172876',
|
|
||||||
'comment_count': int,
|
|
||||||
'uploader_id': 'liputan6',
|
|
||||||
'view_count': int,
|
|
||||||
'dislike_count': int,
|
|
||||||
'upload_date': '20220804',
|
|
||||||
'uploader': 'Liputan6.com',
|
|
||||||
'display_id': 'fakta-temuan-suspek-cacar-monyet-di-jawa-tengah',
|
'display_id': 'fakta-temuan-suspek-cacar-monyet-di-jawa-tengah',
|
||||||
'channel': 'ENAM PLUS 165',
|
'ext': 'mp4',
|
||||||
'timestamp': 1659605520,
|
|
||||||
'title': 'Fakta Temuan Suspek Cacar Monyet di Jawa Tengah',
|
'title': 'Fakta Temuan Suspek Cacar Monyet di Jawa Tengah',
|
||||||
'duration': 59,
|
|
||||||
'like_count': int,
|
|
||||||
'tags': ['monkeypox indonesia', 'cacar monyet menyebar', 'suspek cacar monyet di indonesia', 'fakta', 'hoax atau bukan?', 'jawa tengah'],
|
|
||||||
'thumbnail': 'https://thumbor.prod.vidiocdn.com/83PN-_BKm5sS7emLtRxl506MLqQ=/640x360/filters:quality(70)/vidio-web-prod-video/uploads/video/image/7115874/fakta-suspek-cacar-monyet-di-jawa-tengah-24555a.jpg',
|
|
||||||
'uploader_url': 'https://www.vidio.com/@liputan6',
|
|
||||||
'description': 'md5:6d595a18d3b19ee378e335a6f288d5ac',
|
'description': 'md5:6d595a18d3b19ee378e335a6f288d5ac',
|
||||||
|
'thumbnail': r're:^https?://thumbor\.prod\.vidiocdn\.com/.+\.jpg$',
|
||||||
|
'duration': 59,
|
||||||
|
'uploader': 'liputan6',
|
||||||
|
'timestamp': 1659605693,
|
||||||
|
'upload_date': '20220804',
|
||||||
|
'uploader_id': '139',
|
||||||
|
'channel': 'enam-plus-165',
|
||||||
|
'channel_id': '40172876',
|
||||||
|
'channel_url': 'https://www.vidio.com/@liputan6/channels/40172876-enam-plus-165',
|
||||||
|
'tags': ['monkeypox-indonesia', 'cacar-monyet-menyebar', 'suspek-cacar-monyet-di-indonesia', 'fakta', 'hoax-atau-bukan', 'jawa-tengah'],
|
||||||
|
'uploader_url': 'https://www.vidio.com/@liputan6',
|
||||||
|
'live_status': 'not_live',
|
||||||
|
'genres': ['health'],
|
||||||
|
'season_id': '',
|
||||||
|
'season_name': '',
|
||||||
|
'age_limit': 13,
|
||||||
|
'comment_count': int,
|
||||||
|
},
|
||||||
|
'params': {
|
||||||
|
'getcomments': True,
|
||||||
},
|
},
|
||||||
}]
|
}]
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
match = self._match_valid_url(url).groupdict()
|
video_id, display_id = self._match_valid_url(url).group('id', 'display_id')
|
||||||
video_id, display_id = match.get('id'), match.get('display_id')
|
|
||||||
data = self._call_api('https://api.vidio.com/videos/' + video_id, display_id)
|
|
||||||
video = data['videos'][0]
|
|
||||||
title = video['title'].strip()
|
|
||||||
is_premium = video.get('is_premium')
|
|
||||||
|
|
||||||
if is_premium:
|
webpage = self._download_webpage(url, video_id)
|
||||||
sources = self._download_json(
|
api_data = self._call_api(f'https://api.vidio.com/videos/{video_id}', display_id, 'Downloading API data')
|
||||||
f'https://www.vidio.com/interactions_stream.json?video_id={video_id}&type=videos',
|
interactions_stream = self._download_json(
|
||||||
display_id, note='Downloading premier API JSON')
|
'https://www.vidio.com/interactions_stream.json', video_id,
|
||||||
if not (sources.get('source') or sources.get('source_dash')):
|
query={'video_id': video_id, 'type': 'videos'}, note='Downloading stream info',
|
||||||
self.raise_login_required('This video is only available for registered users with the appropriate subscription')
|
errnote='Unable to download stream info')
|
||||||
|
|
||||||
formats, subs = [], {}
|
attrs = extract_attributes(get_element_html_by_id(f'player-data-{video_id}', webpage))
|
||||||
if sources.get('source'):
|
|
||||||
hls_formats, hls_subs = self._extract_m3u8_formats_and_subtitles(
|
|
||||||
sources['source'], display_id, 'mp4', 'm3u8_native')
|
|
||||||
formats.extend(hls_formats)
|
|
||||||
subs.update(hls_subs)
|
|
||||||
if sources.get('source_dash'): # TODO: Find video example with source_dash
|
|
||||||
dash_formats, dash_subs = self._extract_mpd_formats_and_subtitles(
|
|
||||||
sources['source_dash'], display_id, 'dash')
|
|
||||||
formats.extend(dash_formats)
|
|
||||||
subs.update(dash_subs)
|
|
||||||
else:
|
|
||||||
hls_url = data['clips'][0]['hls_url']
|
|
||||||
formats, subs = self._extract_m3u8_formats_and_subtitles(
|
|
||||||
hls_url, display_id, 'mp4', 'm3u8_native')
|
|
||||||
|
|
||||||
get_first = lambda x: try_get(data, lambda y: y[x + 's'][0], dict) or {}
|
if traverse_obj(attrs, ('data-drm-enabled', {lambda x: x == 'true'})):
|
||||||
channel = get_first('channel')
|
self.report_drm(video_id)
|
||||||
user = get_first('user')
|
if traverse_obj(attrs, ('data-geoblock', {lambda x: x == 'true'})):
|
||||||
username = user.get('username')
|
self.raise_geo_restricted(
|
||||||
get_count = lambda x: int_or_none(video.get('total_' + x))
|
'This show isn\'t available in your country', countries=['ID'], metadata_available=True)
|
||||||
|
|
||||||
|
subtitles = dict(traverse_obj(attrs, ('data-subtitles', {json.loads}, ..., {
|
||||||
|
lambda x: (x['language'], [{'url': x['file']['url']}]),
|
||||||
|
})))
|
||||||
|
formats = []
|
||||||
|
|
||||||
|
# There are time-based strings in the playlist URL,
|
||||||
|
# so try the other URL iff no formats extracted from the prior one.
|
||||||
|
|
||||||
|
for m3u8_url in traverse_obj([
|
||||||
|
interactions_stream.get('source'),
|
||||||
|
attrs.get('data-vjs-clip-hls-url'),
|
||||||
|
], (..., {url_or_none})):
|
||||||
|
fmt, subs = self._extract_m3u8_formats_and_subtitles(m3u8_url, video_id, ext='mp4', m3u8_id='hls')
|
||||||
|
formats.extend(fmt)
|
||||||
|
self._merge_subtitles(subs, subtitles)
|
||||||
|
if fmt:
|
||||||
|
break
|
||||||
|
|
||||||
|
for mpd_url in traverse_obj([
|
||||||
|
interactions_stream.get('source_dash'),
|
||||||
|
attrs.get('data-vjs-clip-dash-url'),
|
||||||
|
], (..., {url_or_none})):
|
||||||
|
fmt, subs = self._extract_mpd_formats_and_subtitles(mpd_url, video_id, mpd_id='dash')
|
||||||
|
formats.extend(fmt)
|
||||||
|
self._merge_subtitles(subs, subtitles)
|
||||||
|
if fmt:
|
||||||
|
break
|
||||||
|
|
||||||
|
# TODO: also extract short previews of premier-exclusive videos from "attrs['data-content-preview-url']".
|
||||||
|
|
||||||
|
uploader = attrs.get('data-video-username')
|
||||||
|
uploader_url = f'https://www.vidio.com/@{uploader}'
|
||||||
|
channel = attrs.get('data-video-channel')
|
||||||
|
channel_id = attrs.get('data-video-channel-id')
|
||||||
|
|
||||||
return {
|
return {
|
||||||
'id': video_id,
|
'id': video_id,
|
||||||
'display_id': display_id,
|
'display_id': display_id,
|
||||||
'title': title,
|
'title': (traverse_obj(api_data, ('videos', 0, 'title'))
|
||||||
'description': strip_or_none(video.get('description')),
|
or attrs.get('data-video-title')
|
||||||
'thumbnail': video.get('image_url_medium'),
|
or self._html_extract_title(webpage)),
|
||||||
'duration': int_or_none(video.get('duration')),
|
'live_status': 'not_live',
|
||||||
'like_count': get_count('likes'),
|
|
||||||
'formats': formats,
|
'formats': formats,
|
||||||
'subtitles': subs,
|
'subtitles': subtitles,
|
||||||
'uploader': user.get('name'),
|
'channel': channel,
|
||||||
'timestamp': parse_iso8601(video.get('created_at')),
|
'channel_id': channel_id,
|
||||||
'uploader_id': username,
|
'channel_url': f'{uploader_url}/channels/{channel_id}-{channel}',
|
||||||
'uploader_url': format_field(username, None, 'https://www.vidio.com/@%s'),
|
'genres': traverse_obj(attrs, ('data-genres', {str}, {lambda x: x.split(',') if x else []}), default=[]),
|
||||||
'channel': channel.get('name'),
|
'season_id': traverse_obj(attrs, ('data-season-id', {str_or_none})),
|
||||||
'channel_id': str_or_none(channel.get('id')),
|
'season_name': traverse_obj(attrs, ('data-season-name', {str})),
|
||||||
'view_count': get_count('view_count'),
|
'uploader': uploader,
|
||||||
'dislike_count': get_count('dislikes'),
|
'uploader_id': traverse_obj(attrs, ('data-video-user-id', {str_or_none})),
|
||||||
'comment_count': get_count('comments'),
|
'uploader_url': uploader_url,
|
||||||
'tags': video.get('tag_list'),
|
'thumbnail': traverse_obj(attrs, ('data-video-image-url', {url_or_none})),
|
||||||
|
'duration': traverse_obj(attrs, ('data-video-duration', {str_to_int})),
|
||||||
|
'description': traverse_obj(attrs, ('data-video-description', {str})),
|
||||||
|
'availability': self._availability(needs_premium=(attrs.get('data-access-type') == 'premium')),
|
||||||
|
'tags': traverse_obj(attrs, ('data-video-tags', {str}, {lambda x: x.split(',') if x else []}), default=[]),
|
||||||
|
'timestamp': traverse_obj(attrs, ('data-video-publish-date', {lambda x: parse_iso8601(x, ' ')})),
|
||||||
|
'age_limit': (traverse_obj(attrs, ('data-adult', {lambda x: 18 if x == 'true' else 0}))
|
||||||
|
or traverse_obj(attrs, ('data-content-rating-option', {lambda x: remove_end(x, ' or more')}, {str_to_int}))),
|
||||||
|
'__post_extractor': self.extract_comments(video_id),
|
||||||
}
|
}
|
||||||
|
|
||||||
|
def _get_comments(self, video_id):
    """Yield the top-level comments of a video from the paginated comments API.

    Each page is fetched with ``self._call_api`` and the next page is taken
    from the response's ``links.next`` URL until none is returned.

    Every yielded dict carries the comment fields (``id``, ``text``,
    ``timestamp``, ``like_count``, ``author_id``) and, when the author is
    listed in the page's ``included`` array, the author fields (``author``,
    ``author_thumbnail``, ``author_url``).
    """
    # TODO: extract replies under comments

    def extract_comments(comments_data):
        # Map user ID -> author fields for the users listed in "included".
        # IDs are compared as strings so that a lookup still succeeds if the
        # API serialises "included[].id" and "attributes.user_id" differently.
        authors = {}
        for user in traverse_obj(comments_data, ('included', ..., {dict})):
            user_id = str_or_none(user.get('id'))
            if user_id is None:
                continue
            # Each field is looked up on its own, so one missing attribute
            # no longer discards the remaining author information.
            authors[user_id] = {
                'author': traverse_obj(user, ('attributes', 'username', {str})),
                'author_thumbnail': traverse_obj(
                    user, ('attributes', ('avatar_url_big', 'avatar_url_small'), {url_or_none}),
                    get_all=False),
                'author_url': traverse_obj(user, ('links', 'self', {url_or_none})),
            }

        for comment in traverse_obj(comments_data, ('data', ..., {
            'id': 'id',
            'text': ('attributes', 'content'),
            'timestamp': ('attributes', 'created_at', {parse_iso8601}),
            'like_count': ('attributes', 'likes'),
            'author_id': ('attributes', 'user_id'),
        })):
            # Fall back to an empty mapping: a comment whose author is not in
            # "included" (or that has no user_id) is still yielded, just
            # without the author details, instead of being silently dropped.
            author = authors.get(str_or_none(comment.get('author_id')), {})
            yield {**comment, **author}

    comment_page_url = f'https://api.vidio.com/videos/{video_id}/comments'
    while comment_page_url:
        comments_data = self._call_api(comment_page_url, video_id, 'Downloading comments')
        # Resolve the next page before yielding so the loop ends as soon as
        # the API stops advertising a valid "next" link.
        comment_page_url = traverse_obj(comments_data, ('links', 'next', {url_or_none}))
        yield from extract_comments(comments_data)
|
||||||
|
|
||||||
|
|
||||||
class VidioPremierIE(VidioBaseIE):
|
class VidioPremierIE(VidioBaseIE):
|
||||||
_VALID_URL = r'https?://(?:www\.)?vidio\.com/premier/(?P<id>\d+)/(?P<display_id>[^/?#&]+)'
|
_VALID_URL = r'https?://(?:www\.)?vidio\.com/premier/(?P<id>\d+)/(?P<display_id>[^/?#&]+)'
|
||||||
|
|
Loading…
Reference in a new issue