mirror of https://github.com/yt-dlp/yt-dlp.git
113 lines
5.1 KiB
Python
113 lines
5.1 KiB
Python
from .brightcove import BrightcoveNewIE
|
||
from .common import InfoExtractor
|
||
|
||
from ..utils import (
|
||
ExtractorError,
|
||
traverse_obj
|
||
)
|
||
|
||
|
||
class OneNewsNZIE(InfoExtractor):
    """Extractor for the videos embedded in 1news.co.nz articles.

    An article is returned as a playlist containing one entry per embedded
    Brightcove or YouTube video listed in the page's Fusion metadata.
    """

    IE_NAME = '1News'
    IE_DESC = '1news.co.nz article videos'
    _VALID_URL = r'https?://(?:www\.)?(?:1|one)news\.co\.nz/\d+/\d+/\d+/(?P<id>[^/?#&]+)'
    _TESTS = [
        {   # Brightcove video
            'url': 'https://www.1news.co.nz/2022/09/29/cows-painted-green-on-parliament-lawn-in-climate-protest/',
            'info_dict': {
                'id': 'cows-painted-green-on-parliament-lawn-in-climate-protest',
                'title': '\'Cows\' painted green on Parliament lawn in climate protest',
            },
            'playlist': [{
                'info_dict': {
                    'id': '6312993358112',
                    'title': 'Activists dressed as cows painted green outside Parliament in climate protest',
                    'ext': 'mp4',
                    'tags': 'count:6',
                    'uploader_id': '963482464001',
                    'timestamp': 1664416255,
                    'upload_date': '20220929',
                    'duration': 38.272,
                    'thumbnail': r're:^https?://.*\.jpg$',
                    'description': 'Greenpeace accused the Government of "greenwashing" instead of taking climate action.',
                }
            }]
        }, {
            # YouTube video
            'url': 'https://www.1news.co.nz/2022/09/30/now-is-the-time-to-care-about-womens-rugby/',
            'info_dict': {
                'id': 'now-is-the-time-to-care-about-womens-rugby',
                'title': 'Now is the time to care about women\'s rugby',
            },
            'playlist': [{
                'info_dict': {
                    'id': 's4wEB9neTfU',
                    'title': 'Why I love women’s rugby: Black Fern Ruahei Demant',
                    'ext': 'mp4',
                    'channel_follower_count': int,
                    'channel_url': 'https://www.youtube.com/channel/UC2BQ3U9IxoYIJyulv0bN5PQ',
                    'tags': 'count:12',
                    'uploader': 'Re: News',
                    'upload_date': '20211215',
                    'uploader_id': 'UC2BQ3U9IxoYIJyulv0bN5PQ',
                    'uploader_url': 'http://www.youtube.com/channel/UC2BQ3U9IxoYIJyulv0bN5PQ',
                    'channel_id': 'UC2BQ3U9IxoYIJyulv0bN5PQ',
                    'channel': 'Re: News',
                    'like_count': int,
                    'thumbnail': 'https://i.ytimg.com/vi/s4wEB9neTfU/maxresdefault.jpg',
                    'age_limit': 0,
                    'view_count': int,
                    'categories': ['Sports'],
                    'duration': 222,
                    'description': 'md5:8874410e5740ed1d8fd0df839f849813',
                    'availability': 'public',
                    'playable_in_embed': True,
                    'live_status': 'not_live',
                }
            }]
        }, {
            # 2 Brightcove videos
            'url': 'https://www.1news.co.nz/2022/09/29/raw-videos-capture-hurricane-ians-fury-as-it-slams-florida/',
            'info_dict': {
                'id': 'raw-videos-capture-hurricane-ians-fury-as-it-slams-florida',
                'title': 'Raw videos capture Hurricane Ian\'s fury as it slams Florida',
            },
            'playlist_mincount': 2,
        }, {
            'url': 'https://www.onenews.co.nz/2022/09/29/cows-painted-green-on-parliament-lawn-in-climate-protest/',
            'only_matching': True,
        }]

    # Filled with (account id, video id) to build a Brightcove player URL.
    BRIGHTCOVE_URL_TEMPLATE = 'http://players.brightcove.net/%s/0xpHIR6IB_default/index.html?videoId=%s'

    def _real_extract(self, url):
        """Build a playlist of the videos embedded in the article at *url*.

        The article page is downloaded and its ``Fusion.globalContent`` JSON
        is scanned for ``content_elements`` whose ``subtype`` is ``video``
        (Brightcove) or ``youtube``. Elements without a usable video id are
        skipped.

        Raises:
            ExtractorError: (expected) if no playable video element is found.
        """
        display_id = self._match_id(url)
        webpage = self._download_webpage(url, display_id)

        fusion_metadata = self._search_json(r'Fusion\.globalContent\s*=', webpage, 'fusion metadata', display_id)

        entries = []
        for item in traverse_obj(fusion_metadata, 'content_elements') or []:
            item_type = traverse_obj(item, 'subtype')
            if item_type == 'video':
                brightcove_config = traverse_obj(item, ('embed', 'config'))
                brightcove_video_id = traverse_obj(brightcove_config, 'brightcoveVideoId')
                if not brightcove_video_id:
                    # Formatting the template without an id would yield
                    # "...?videoId=None"; skip the element instead, mirroring
                    # how the YouTube branch below ignores items with no id.
                    continue
                brightcove_url = self.BRIGHTCOVE_URL_TEMPLATE % (
                    # Fall back to this account id when the config has none.
                    traverse_obj(brightcove_config, 'brightcoveAccount') or '963482464001',
                    brightcove_video_id,
                )
                entries.append(self.url_result(brightcove_url, BrightcoveNewIE))
            elif item_type == 'youtube':
                # Prefer the referent id, then the raw oEmbed id.
                video_id_or_url = traverse_obj(item, ('referent', 'id'), ('raw_oembed', '_id'))
                if video_id_or_url:
                    entries.append(self.url_result(video_id_or_url, ie='Youtube'))

        if not entries:
            raise ExtractorError('This article does not have a video.', expected=True)

        # Title preference: Fusion headline, then og:title, then <title>.
        playlist_title = (
            traverse_obj(fusion_metadata, ('headlines', 'basic'))
            or self._og_search_title(webpage)
            or self._html_extract_title(webpage)
        )
        return self.playlist_result(entries, display_id, playlist_title)
|