mirror of
https://github.com/yt-dlp/yt-dlp.git
synced 2024-11-10 15:14:57 +00:00
[extractor/cbs] Add ParamountPressExpress
extractor (#6604)
Closes #6597 Authored by: bashonly
This commit is contained in:
parent
c2e0fc40a7
commit
44369c9afa
3 changed files with 121 additions and 3 deletions
|
@ -298,7 +298,10 @@ from .cbc import (
|
||||||
CBCGemPlaylistIE,
|
CBCGemPlaylistIE,
|
||||||
CBCGemLiveIE,
|
CBCGemLiveIE,
|
||||||
)
|
)
|
||||||
from .cbs import CBSIE
|
from .cbs import (
|
||||||
|
CBSIE,
|
||||||
|
ParamountPressExpressIE,
|
||||||
|
)
|
||||||
from .cbslocal import (
|
from .cbslocal import (
|
||||||
CBSLocalIE,
|
CBSLocalIE,
|
||||||
CBSLocalArticleIE,
|
CBSLocalArticleIE,
|
||||||
|
|
|
@ -575,6 +575,7 @@ class BrightcoveNewBaseIE(AdobePassIE):
|
||||||
self.raise_no_formats(
|
self.raise_no_formats(
|
||||||
error.get('message') or error.get('error_subcode') or error['error_code'], expected=True)
|
error.get('message') or error.get('error_subcode') or error['error_code'], expected=True)
|
||||||
|
|
||||||
|
headers.pop('Authorization', None) # or else http formats will give error 400
|
||||||
for f in formats:
|
for f in formats:
|
||||||
f.setdefault('http_headers', {}).update(headers)
|
f.setdefault('http_headers', {}).update(headers)
|
||||||
|
|
||||||
|
@ -895,8 +896,9 @@ class BrightcoveNewIE(BrightcoveNewBaseIE):
|
||||||
store_pk(policy_key)
|
store_pk(policy_key)
|
||||||
return policy_key
|
return policy_key
|
||||||
|
|
||||||
api_url = 'https://edge.api.brightcove.com/playback/v1/accounts/%s/%ss/%s' % (account_id, content_type, video_id)
|
token = smuggled_data.get('token')
|
||||||
headers = {}
|
api_url = f'https://{"edge-auth" if token else "edge"}.api.brightcove.com/playback/v1/accounts/{account_id}/{content_type}s/{video_id}'
|
||||||
|
headers = {'Authorization': f'Bearer {token}'} if token else {}
|
||||||
referrer = smuggled_data.get('referrer') # XXX: notice the spelling/case of the key
|
referrer = smuggled_data.get('referrer') # XXX: notice the spelling/case of the key
|
||||||
if referrer:
|
if referrer:
|
||||||
headers.update({
|
headers.update({
|
||||||
|
|
|
@ -1,8 +1,14 @@
|
||||||
|
from .brightcove import BrightcoveNewIE
|
||||||
|
from .common import InfoExtractor
|
||||||
from .theplatform import ThePlatformFeedIE
|
from .theplatform import ThePlatformFeedIE
|
||||||
|
from .youtube import YoutubeIE
|
||||||
from ..utils import (
|
from ..utils import (
|
||||||
ExtractorError,
|
ExtractorError,
|
||||||
|
extract_attributes,
|
||||||
|
get_element_html_by_id,
|
||||||
int_or_none,
|
int_or_none,
|
||||||
find_xpath_attr,
|
find_xpath_attr,
|
||||||
|
smuggle_url,
|
||||||
xpath_element,
|
xpath_element,
|
||||||
xpath_text,
|
xpath_text,
|
||||||
update_url_query,
|
update_url_query,
|
||||||
|
@ -162,3 +168,110 @@ class CBSIE(CBSBaseIE):
|
||||||
'duration': int_or_none(xpath_text(video_data, 'videoLength'), 1000),
|
'duration': int_or_none(xpath_text(video_data, 'videoLength'), 1000),
|
||||||
'thumbnail': url_or_none(xpath_text(video_data, 'previewImageURL')),
|
'thumbnail': url_or_none(xpath_text(video_data, 'previewImageURL')),
|
||||||
})
|
})
|
||||||
|
|
||||||
|
|
||||||
|
class ParamountPressExpressIE(InfoExtractor):
|
||||||
|
_VALID_URL = r'https?://(?:www\.)?paramountpressexpress\.com(?:/[\w-]+)+/(?P<yt>yt-)?video/?\?watch=(?P<id>[\w-]+)'
|
||||||
|
_TESTS = [{
|
||||||
|
'url': 'https://www.paramountpressexpress.com/cbs-entertainment/shows/survivor/video/?watch=pnzew7e2hx',
|
||||||
|
'md5': '56631dbcadaab980d1fc47cb7b76cba4',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '6322981580112',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'I’m Felicia',
|
||||||
|
'description': 'md5:88fad93f8eede1c9c8f390239e4c6290',
|
||||||
|
'uploader_id': '6055873637001',
|
||||||
|
'upload_date': '20230320',
|
||||||
|
'timestamp': 1679334960,
|
||||||
|
'duration': 49.557,
|
||||||
|
'thumbnail': r're:^https://.+\.jpg',
|
||||||
|
'tags': [],
|
||||||
|
},
|
||||||
|
}, {
|
||||||
|
'url': 'https://www.paramountpressexpress.com/cbs-entertainment/video/?watch=2s5eh8kppc',
|
||||||
|
'md5': 'edcb03e3210b88a3e56c05aa863e0e5b',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '6323036027112',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': '‘Y&R’ Set Visit: Jerry O’Connell Quizzes Cast on Pre-Love Scene Rituals and More',
|
||||||
|
'description': 'md5:b929867a357aac5544b783d834c78383',
|
||||||
|
'uploader_id': '6055873637001',
|
||||||
|
'upload_date': '20230321',
|
||||||
|
'timestamp': 1679430180,
|
||||||
|
'duration': 132.032,
|
||||||
|
'thumbnail': r're:^https://.+\.jpg',
|
||||||
|
'tags': [],
|
||||||
|
},
|
||||||
|
}, {
|
||||||
|
'url': 'https://www.paramountpressexpress.com/paramount-plus/yt-video/?watch=OX9wJWOcqck',
|
||||||
|
'info_dict': {
|
||||||
|
'id': 'OX9wJWOcqck',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'Rugrats | Season 2 Official Trailer | Paramount+',
|
||||||
|
'description': 'md5:1f7e26f5625a9f0d6564d9ad97a9f7de',
|
||||||
|
'uploader': 'Paramount Plus',
|
||||||
|
'uploader_id': '@paramountplus',
|
||||||
|
'uploader_url': 'http://www.youtube.com/@paramountplus',
|
||||||
|
'channel': 'Paramount Plus',
|
||||||
|
'channel_id': 'UCrRttZIypNTA1Mrfwo745Sg',
|
||||||
|
'channel_url': 'https://www.youtube.com/channel/UCrRttZIypNTA1Mrfwo745Sg',
|
||||||
|
'upload_date': '20230316',
|
||||||
|
'duration': 88,
|
||||||
|
'age_limit': 0,
|
||||||
|
'availability': 'public',
|
||||||
|
'live_status': 'not_live',
|
||||||
|
'playable_in_embed': True,
|
||||||
|
'view_count': int,
|
||||||
|
'like_count': int,
|
||||||
|
'channel_follower_count': int,
|
||||||
|
'thumbnail': 'https://i.ytimg.com/vi/OX9wJWOcqck/maxresdefault.jpg',
|
||||||
|
'categories': ['Entertainment'],
|
||||||
|
'tags': ['Rugrats'],
|
||||||
|
},
|
||||||
|
}, {
|
||||||
|
'url': 'https://www.paramountpressexpress.com/showtime/yt-video/?watch=_ljssSoDLkw',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '_ljssSoDLkw',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'Lavell Crawford: THEE Lavell Crawford Comedy Special Official Trailer | SHOWTIME',
|
||||||
|
'description': 'md5:39581bcc3fd810209b642609f448af70',
|
||||||
|
'uploader': 'SHOWTIME',
|
||||||
|
'uploader_id': '@Showtime',
|
||||||
|
'uploader_url': 'http://www.youtube.com/@Showtime',
|
||||||
|
'channel': 'SHOWTIME',
|
||||||
|
'channel_id': 'UCtwMWJr2BFPkuJTnSvCESSQ',
|
||||||
|
'channel_url': 'https://www.youtube.com/channel/UCtwMWJr2BFPkuJTnSvCESSQ',
|
||||||
|
'upload_date': '20230209',
|
||||||
|
'duration': 49,
|
||||||
|
'age_limit': 0,
|
||||||
|
'availability': 'public',
|
||||||
|
'live_status': 'not_live',
|
||||||
|
'playable_in_embed': True,
|
||||||
|
'view_count': int,
|
||||||
|
'like_count': int,
|
||||||
|
'comment_count': int,
|
||||||
|
'channel_follower_count': int,
|
||||||
|
'thumbnail': 'https://i.ytimg.com/vi_webp/_ljssSoDLkw/maxresdefault.webp',
|
||||||
|
'categories': ['People & Blogs'],
|
||||||
|
'tags': 'count:27',
|
||||||
|
},
|
||||||
|
}]
|
||||||
|
|
||||||
|
def _real_extract(self, url):
|
||||||
|
display_id, is_youtube = self._match_valid_url(url).group('id', 'yt')
|
||||||
|
if is_youtube:
|
||||||
|
return self.url_result(display_id, YoutubeIE)
|
||||||
|
|
||||||
|
webpage = self._download_webpage(url, display_id)
|
||||||
|
video_id = self._search_regex(
|
||||||
|
r'\bvideo_id\s*=\s*["\'](\d+)["\']\s*,', webpage, 'Brightcove ID')
|
||||||
|
token = self._search_regex(r'\btoken\s*=\s*["\']([\w.-]+)["\']', webpage, 'token')
|
||||||
|
|
||||||
|
player = extract_attributes(get_element_html_by_id('vcbrightcoveplayer', webpage) or '')
|
||||||
|
account_id = player.get('data-account') or '6055873637001'
|
||||||
|
player_id = player.get('data-player') or 'OtLKgXlO9F'
|
||||||
|
embed = player.get('data-embed') or 'default'
|
||||||
|
|
||||||
|
return self.url_result(smuggle_url(
|
||||||
|
f'https://players.brightcove.net/{account_id}/{player_id}_{embed}/index.html?videoId={video_id}',
|
||||||
|
{'token': token}), BrightcoveNewIE)
|
||||||
|
|
Loading…
Reference in a new issue