mirror of
https://github.com/yt-dlp/yt-dlp
synced 2025-01-15 03:41:33 +01:00
[extractor/tennistv] Rewrite extractor (#2324)
Closes #2177 Authored by: zenerdi0de, pukkandan
This commit is contained in:
parent
0c36dc00d7
commit
37e40d693b
1 changed files with 111 additions and 64 deletions
|
@ -1,16 +1,17 @@
|
||||||
import json
|
import urllib.parse
|
||||||
|
|
||||||
from .common import InfoExtractor
|
from .common import InfoExtractor
|
||||||
|
|
||||||
from ..utils import (
|
from ..utils import (
|
||||||
ExtractorError,
|
ExtractorError,
|
||||||
|
random_uuidv4,
|
||||||
unified_timestamp,
|
unified_timestamp,
|
||||||
|
urlencode_postdata,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
class TennisTVIE(InfoExtractor):
|
class TennisTVIE(InfoExtractor):
|
||||||
_VALID_URL = r'https?://(?:www\.)?tennistv\.com/videos/(?P<id>[-a-z0-9]+)'
|
_VALID_URL = r'https?://(?:www\.)?tennistv\.com/videos/(?P<id>[-a-z0-9]+)'
|
||||||
_TEST = {
|
_TESTS = [{
|
||||||
'url': 'https://www.tennistv.com/videos/indian-wells-2018-verdasco-fritz',
|
'url': 'https://www.tennistv.com/videos/indian-wells-2018-verdasco-fritz',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': 'indian-wells-2018-verdasco-fritz',
|
'id': 'indian-wells-2018-verdasco-fritz',
|
||||||
|
@ -25,86 +26,132 @@ class TennisTVIE(InfoExtractor):
|
||||||
'skip_download': True,
|
'skip_download': True,
|
||||||
},
|
},
|
||||||
'skip': 'Requires email and password of a subscribed account',
|
'skip': 'Requires email and password of a subscribed account',
|
||||||
}
|
}, {
|
||||||
|
'url': 'https://www.tennistv.com/videos/2650480/best-matches-of-2022-part-5',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '2650480',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'Best Matches of 2022 - Part 5',
|
||||||
|
'description': 'md5:36dec3bfae7ed74bd79e48045b17264c',
|
||||||
|
'thumbnail': 'https://open.http.mp.streamamg.com/p/3001482/sp/300148200/thumbnail/entry_id/0_myef18pd/version/100001/height/1920',
|
||||||
|
},
|
||||||
|
'params': {'skip_download': 'm3u8'},
|
||||||
|
'skip': 'Requires email and password of a subscribed account',
|
||||||
|
}]
|
||||||
_NETRC_MACHINE = 'tennistv'
|
_NETRC_MACHINE = 'tennistv'
|
||||||
_session_token = None
|
|
||||||
|
access_token, refresh_token = None, None
|
||||||
|
_PARTNER_ID = 3001482
|
||||||
|
_FORMAT_URL = 'https://open.http.mp.streamamg.com/p/{partner}/sp/{partner}00/playManifest/entryId/{entry}/format/applehttp/protocol/https/a.m3u8?ks={session}'
|
||||||
|
_AUTH_BASE_URL = 'https://sso.tennistv.com/auth/realms/TennisTV/protocol/openid-connect'
|
||||||
|
_HEADERS = {
|
||||||
|
'origin': 'https://www.tennistv.com',
|
||||||
|
'referer': 'https://www.tennistv.com/',
|
||||||
|
'content-Type': 'application/x-www-form-urlencoded'
|
||||||
|
}
|
||||||
|
|
||||||
def _perform_login(self, username, password):
|
def _perform_login(self, username, password):
|
||||||
|
login_page = self._download_webpage(
|
||||||
|
f'{self._AUTH_BASE_URL}/auth', None, 'Downloading login page',
|
||||||
|
query={
|
||||||
|
'client_id': 'tennis-tv-web',
|
||||||
|
'redirect_uri': 'https://tennistv.com',
|
||||||
|
'response_mode': 'fragment',
|
||||||
|
'response_type': 'code',
|
||||||
|
'scope': 'openid'
|
||||||
|
})
|
||||||
|
|
||||||
login_form = {
|
post_url = self._html_search_regex(r'action=["\']([^"\']+?)["\']\s+method=["\']post["\']', login_page, 'login POST url')
|
||||||
'Email': username,
|
temp_page = self._download_webpage(
|
||||||
'Password': password,
|
post_url, None, 'Sending login data', 'Unable to send login data',
|
||||||
}
|
headers=self._HEADERS, data=urlencode_postdata({
|
||||||
login_json = json.dumps(login_form).encode('utf-8')
|
'username': username,
|
||||||
headers = {
|
'password': password,
|
||||||
'content-type': 'application/json',
|
'submitAction': 'Log In'
|
||||||
'Referer': 'https://www.tennistv.com/login',
|
}))
|
||||||
'Origin': 'https://www.tennistv.com',
|
if 'Your username or password was incorrect' in temp_page:
|
||||||
}
|
raise ExtractorError('Your username or password was incorrect', expected=True)
|
||||||
|
|
||||||
login_result = self._download_json(
|
handle = self._request_webpage(
|
||||||
'https://www.tennistv.com/api/users/v1/login', None,
|
f'{self._AUTH_BASE_URL}/auth', None, 'Logging in', headers=self._HEADERS,
|
||||||
note='Logging in',
|
query={
|
||||||
errnote='Login failed (wrong password?)',
|
'client_id': 'tennis-tv-web',
|
||||||
headers=headers,
|
'redirect_uri': 'https://www.tennistv.com/resources/v1.1.10/html/silent-check-sso.html',
|
||||||
data=login_json)
|
'state': random_uuidv4(),
|
||||||
|
'response_mode': 'fragment',
|
||||||
|
'response_type': 'code',
|
||||||
|
'scope': 'openid',
|
||||||
|
'nonce': random_uuidv4(),
|
||||||
|
'prompt': 'none'
|
||||||
|
})
|
||||||
|
|
||||||
if login_result['error']['errorCode']:
|
self.get_token(None, {
|
||||||
raise ExtractorError('Login failed, %s said: %r' % (self.IE_NAME, login_result['error']['errorMessage']))
|
'code': urllib.parse.parse_qs(handle.geturl())['code'][-1],
|
||||||
|
'grant_type': 'authorization_code',
|
||||||
|
'client_id': 'tennis-tv-web',
|
||||||
|
'redirect_uri': 'https://www.tennistv.com/resources/v1.1.10/html/silent-check-sso.html'
|
||||||
|
})
|
||||||
|
|
||||||
if login_result['entitlement'] != 'SUBSCRIBED':
|
def get_token(self, video_id, payload):
|
||||||
self.report_warning('%s may not be subscribed to %s.' % (username, self.IE_NAME))
|
res = self._download_json(
|
||||||
|
f'{self._AUTH_BASE_URL}/token', video_id, 'Fetching tokens',
|
||||||
|
'Unable to fetch tokens', headers=self._HEADERS, data=urlencode_postdata(payload))
|
||||||
|
|
||||||
self._session_token = login_result['sessionToken']
|
self.access_token = res.get('access_token') or self.access_token
|
||||||
|
self.refresh_token = res.get('refresh_token') or self.refresh_token
|
||||||
|
|
||||||
def _real_initialize(self):
|
def _real_initialize(self):
|
||||||
if not self._session_token:
|
if self.access_token and self.refresh_token:
|
||||||
raise self.raise_login_required('Login info is needed for this website', method='password')
|
return
|
||||||
|
|
||||||
|
cookies = self._get_cookies('https://www.tennistv.com/')
|
||||||
|
if not cookies.get('access_token') or not cookies.get('refresh_token'):
|
||||||
|
self.raise_login_required()
|
||||||
|
self.access_token, self.refresh_token = cookies['access_token'].value, cookies['refresh_token'].value
|
||||||
|
|
||||||
|
def _download_session_json(self, video_id, entryid,):
|
||||||
|
return self._download_json(
|
||||||
|
f'https://atppayments.streamamg.com/api/v1/session/ksession/?lang=en&apijwttoken={self.access_token}&entryId={entryid}',
|
||||||
|
video_id, 'Downloading ksession token', 'Failed to download ksession token', headers=self._HEADERS)
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
video_id = self._match_id(url)
|
video_id = self._match_id(url)
|
||||||
webpage = self._download_webpage(url, video_id)
|
webpage = self._download_webpage(url, video_id)
|
||||||
|
|
||||||
internal_id = self._search_regex(r'video=([\w-]+)', webpage, 'internal video id')
|
entryid = self._search_regex(r'data-entry-id=["\']([^"\']+)', webpage, 'entryID')
|
||||||
|
session_json = self._download_session_json(video_id, entryid)
|
||||||
|
|
||||||
|
k_session = session_json.get('KSession')
|
||||||
|
if k_session is None:
|
||||||
|
self.get_token(video_id, {
|
||||||
|
'grant_type': 'refresh_token',
|
||||||
|
'refresh_token': self.refresh_token,
|
||||||
|
'client_id': 'tennis-tv-web'
|
||||||
|
})
|
||||||
|
k_session = self._download_session_json(video_id, entryid).get('KSession')
|
||||||
|
if k_session is None:
|
||||||
|
raise ExtractorError('Failed to get KSession, possibly a premium video', expected=True)
|
||||||
|
|
||||||
|
if session_json.get('ErrorMessage'):
|
||||||
|
self.report_warning(session_json['ErrorMessage'])
|
||||||
|
|
||||||
|
formats, subtitles = self._extract_m3u8_formats_and_subtitles(
|
||||||
|
self._FORMAT_URL.format(partner=self._PARTNER_ID, entry=entryid, session=k_session), video_id)
|
||||||
|
|
||||||
headers = {
|
|
||||||
'Origin': 'https://www.tennistv.com',
|
|
||||||
'authorization': 'ATP %s' % self._session_token,
|
|
||||||
'content-type': 'application/json',
|
|
||||||
'Referer': url,
|
|
||||||
}
|
|
||||||
check_data = {
|
|
||||||
'videoID': internal_id,
|
|
||||||
'VideoUrlType': 'HLS',
|
|
||||||
}
|
|
||||||
check_json = json.dumps(check_data).encode('utf-8')
|
|
||||||
check_result = self._download_json(
|
|
||||||
'https://www.tennistv.com/api/users/v1/entitlementchecknondiva',
|
|
||||||
video_id, note='Checking video authorization', headers=headers, data=check_json)
|
|
||||||
formats = self._extract_m3u8_formats(check_result['contentUrl'], video_id, ext='mp4')
|
|
||||||
self._sort_formats(formats)
|
self._sort_formats(formats)
|
||||||
|
|
||||||
vdata = self._download_json(
|
|
||||||
'https://www.tennistv.com/api/en/v2/none/common/video/%s' % video_id,
|
|
||||||
video_id, headers=headers)
|
|
||||||
|
|
||||||
timestamp = unified_timestamp(vdata['timestamp'])
|
|
||||||
thumbnail = vdata['video']['thumbnailUrl']
|
|
||||||
description = vdata['displayText']['description']
|
|
||||||
title = vdata['video']['title']
|
|
||||||
|
|
||||||
series = vdata['tour']
|
|
||||||
venue = vdata['displayText']['venue']
|
|
||||||
round_str = vdata['seo']['round']
|
|
||||||
|
|
||||||
return {
|
return {
|
||||||
'id': video_id,
|
'id': video_id,
|
||||||
'title': title,
|
'title': self._html_extract_title(webpage) or self._og_search_title(webpage),
|
||||||
'description': description,
|
'description': self._html_search_regex(
|
||||||
|
(r'<span itemprop="description" content=["\']([^"\']+)["\']>', *self._og_regexes('description')),
|
||||||
|
webpage, 'description', fatal=False),
|
||||||
|
'thumbnail': f'https://open.http.mp.streamamg.com/p/{self._PARTNER_ID}/sp/{self._PARTNER_ID}00/thumbnail/entry_id/{entryid}/version/100001/height/1920',
|
||||||
|
'timestamp': unified_timestamp(self._html_search_regex(
|
||||||
|
r'<span itemprop="description" content=["\']([^"\']+)["\']>', webpage, 'upload time')),
|
||||||
|
'series': self._html_search_regex(r'data-series\s*?=\s*?"(.*?)"', webpage, 'series', fatal=False) or None,
|
||||||
|
'season': self._html_search_regex(r'data-tournament-city\s*?=\s*?"(.*?)"', webpage, 'season', fatal=False) or None,
|
||||||
|
'episode': self._html_search_regex(r'data-round\s*?=\s*?"(.*?)"', webpage, 'round', fatal=False) or None,
|
||||||
'formats': formats,
|
'formats': formats,
|
||||||
'thumbnail': thumbnail,
|
'subtitles': subtitles,
|
||||||
'timestamp': timestamp,
|
|
||||||
'series': series,
|
|
||||||
'season': venue,
|
|
||||||
'episode': round_str,
|
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in a new issue