mirror of
https://github.com/yt-dlp/yt-dlp
synced 2025-01-19 10:26:56 +01:00
[ie/afl][ie/omnyfm] added AFLPodcastIE and updated OmnyFMShowIE
1. AFLPodcastIE: Added extractor for AFL podcasts 2. OmnyFMShowIE: Updated code to adjust url before download page to support various url patterns
This commit is contained in:
parent
8125680192
commit
5fea24bda2
3 changed files with 30 additions and 2 deletions
|
@ -76,7 +76,7 @@ from .aenetworks import (
|
||||||
)
|
)
|
||||||
from .aeonco import AeonCoIE
|
from .aeonco import AeonCoIE
|
||||||
from .afl import (
|
from .afl import (
|
||||||
AFLPodcastsIE,
|
AFLPodcastIE,
|
||||||
AFLVideoIE,
|
AFLVideoIE,
|
||||||
)
|
)
|
||||||
from .afreecatv import (
|
from .afreecatv import (
|
||||||
|
|
|
@ -1,12 +1,14 @@
|
||||||
|
|
||||||
from .brightcove import BrightcoveNewIE
|
from .brightcove import BrightcoveNewIE
|
||||||
from .common import InfoExtractor
|
from .common import InfoExtractor
|
||||||
|
from .omnyfm import OmnyFMShowIE
|
||||||
from ..utils import (
|
from ..utils import (
|
||||||
extract_attributes,
|
extract_attributes,
|
||||||
get_element_by_class,
|
get_element_by_class,
|
||||||
smuggle_url,
|
smuggle_url,
|
||||||
str_or_none,
|
str_or_none,
|
||||||
traverse_obj,
|
traverse_obj,
|
||||||
|
url_or_none,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
|
@ -52,3 +54,27 @@ class AFLVideoIE(InfoExtractor):
|
||||||
video_url = f'https://players.brightcove.net/{account_id}/{player_id}/index.html?videoId={video_id}'
|
video_url = f'https://players.brightcove.net/{account_id}/{player_id}/index.html?videoId={video_id}'
|
||||||
video_url = smuggle_url(video_url, {'referrer': url})
|
video_url = smuggle_url(video_url, {'referrer': url})
|
||||||
return self.url_result(video_url, BrightcoveNewIE)
|
return self.url_result(video_url, BrightcoveNewIE)
|
||||||
|
|
||||||
|
|
||||||
|
class AFLPodcastIE(InfoExtractor):
|
||||||
|
IE_NAME = 'afl:podcast'
|
||||||
|
_VALID_URL = r'https?://(?:www\.)?afl\.com.au/(?:aflw/)?podcasts/(?P<id>[\w-]+)'
|
||||||
|
_TESTS = [{
|
||||||
|
'url': 'https://www.afl.com.au/podcasts/between-us',
|
||||||
|
'md5': '7000431c2bd3f96eddb5f63273aea83e',
|
||||||
|
'info_dict': {
|
||||||
|
'id': 'e0ab8454-f818-483f-bed1-b156002c021f',
|
||||||
|
'title': 'Between Us',
|
||||||
|
},
|
||||||
|
'playlist_mincount': 7,
|
||||||
|
}, {
|
||||||
|
'url': 'https://www.afl.com.au/podcasts/afl-daily',
|
||||||
|
'only_matching': True,
|
||||||
|
}]
|
||||||
|
|
||||||
|
def _real_extract(self, url):
|
||||||
|
display_id = self._match_id(url)
|
||||||
|
webpage = self._download_webpage(url, display_id)
|
||||||
|
element = get_element_by_class('omny-embed', webpage)
|
||||||
|
podcast_url = traverse_obj(extract_attributes(element), ('src', {url_or_none}))
|
||||||
|
return self.url_result(podcast_url, OmnyFMShowIE)
|
||||||
|
|
|
@ -19,6 +19,7 @@ from ..utils import (
|
||||||
class OmnyFMShowIE(InfoExtractor):
|
class OmnyFMShowIE(InfoExtractor):
|
||||||
IE_NAME = 'omnyfm:show'
|
IE_NAME = 'omnyfm:show'
|
||||||
_VALID_URL = r'https?://omny\.fm/shows/(?P<id>[\w-]+)'
|
_VALID_URL = r'https?://omny\.fm/shows/(?P<id>[\w-]+)'
|
||||||
|
_EMBED_REGEX = [r'<iframe[^>]+?src=(?:["\'])(?P<url>https?://omny\.fm/shows/.+?)\1']
|
||||||
_PAGE_SIZE = 10
|
_PAGE_SIZE = 10
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'https://omny.fm/shows/league-leaders',
|
'url': 'https://omny.fm/shows/league-leaders',
|
||||||
|
@ -53,7 +54,8 @@ class OmnyFMShowIE(InfoExtractor):
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
display_id = self._match_id(url)
|
display_id = self._match_id(url)
|
||||||
webpage = self._download_webpage(url, display_id)
|
page_url = 'https://omny.fm/shows/' + display_id
|
||||||
|
webpage = self._download_webpage(page_url, display_id)
|
||||||
|
|
||||||
data = json.loads(get_element_by_id('__NEXT_DATA__', webpage))
|
data = json.loads(get_element_by_id('__NEXT_DATA__', webpage))
|
||||||
org_id = traverse_obj(data, ('props', 'pageProps', 'program', 'OrganizationId', {str_or_none}))
|
org_id = traverse_obj(data, ('props', 'pageProps', 'program', 'OrganizationId', {str_or_none}))
|
||||||
|
|
Loading…
Reference in a new issue