from .common import InfoExtractor from ..utils import ( ExtractorError, extract_attributes, get_element_text_and_html_by_tag, int_or_none, join_nonempty, str_or_none, try_call, unified_timestamp, ) from ..utils.traversal import traverse_obj class DuoplayIE(InfoExtractor): _VALID_URL = r'https://duoplay\.ee/(?P\d+)/[\w-]+/?(?:\?(?:[^#]+&)?ep=(?P\d+))?' _TESTS = [{ 'note': 'Siberi võmm S02E12', 'url': 'https://duoplay.ee/4312/siberi-vomm?ep=24', 'md5': '1ff59d535310ac9c5cf5f287d8f91b2d', 'info_dict': { 'id': '4312_24', 'ext': 'mp4', 'title': 'Operatsioon "Öö"', 'thumbnail': r're:https://.+\.jpg(?:\?c=\d+)?$', 'description': 'md5:8ef98f38569d6b8b78f3d350ccc6ade8', 'upload_date': '20170523', 'timestamp': 1495567800, 'series': 'Siberi võmm', 'series_id': '4312', 'season': 'Season 2', 'season_number': 2, 'episode': 'Operatsioon "Öö"', 'episode_number': 12, 'episode_id': 24, }, }, { 'note': 'Empty title', 'url': 'https://duoplay.ee/17/uhikarotid?ep=14', 'md5': '6aca68be71112314738dd17cced7f8bf', 'info_dict': { 'id': '17_14', 'ext': 'mp4', 'title': 'Ühikarotid', 'thumbnail': r're:https://.+\.jpg(?:\?c=\d+)?$', 'description': 'md5:4719b418e058c209def41d48b601276e', 'upload_date': '20100916', 'timestamp': 1284661800, 'series': 'Ühikarotid', 'series_id': '17', 'season': 'Season 2', 'season_number': 2, 'episode_id': 14, 'release_year': 2010, }, }, { 'note': 'Movie without expiry', 'url': 'https://duoplay.ee/5501/pilvede-all.-neljas-ode', 'md5': '7abf63d773a49ef7c39f2c127842b8fd', 'info_dict': { 'id': '5501', 'ext': 'mp4', 'title': 'Pilvede all. Neljas õde', 'thumbnail': r're:https://.+\.jpg(?:\?c=\d+)?$', 'description': 'md5:d86a70f8f31e82c369d4d4f4c79b1279', 'cast': 'count:9', 'upload_date': '20221214', 'timestamp': 1671054000, 'release_year': 2018, }, }] def _real_extract(self, url): telecast_id, episode = self._match_valid_url(url).group('id', 'ep') video_id = join_nonempty(telecast_id, episode, delim='_') webpage = self._download_webpage(url, video_id) video_player = try_call(lambda: extract_attributes( get_element_text_and_html_by_tag('video-player', webpage)[1])) if not video_player or not video_player.get('manifest-url'): raise ExtractorError('No video found', expected=True) episode_attr = self._parse_json(video_player.get(':episode') or '', video_id, fatal=False) or {} return { 'id': video_id, 'formats': self._extract_m3u8_formats(video_player['manifest-url'], video_id, 'mp4'), **traverse_obj(episode_attr, { 'title': 'title', 'description': 'synopsis', 'thumbnail': ('images', 'original'), 'timestamp': ('airtime', {lambda x: unified_timestamp(x + ' +0200')}), 'cast': ('cast', {lambda x: x.split(', ')}), 'release_year': ('year', {int_or_none}), }), **(traverse_obj(episode_attr, { 'title': (None, ('subtitle', ('episode_nr', {lambda x: f'Episode {x}' if x else None}))), 'series': 'title', 'series_id': ('telecast_id', {str_or_none}), 'season_number': ('season_id', {int_or_none}), 'episode': 'subtitle', 'episode_number': ('episode_nr', {int_or_none}), 'episode_id': ('episode_id', {int_or_none}), }, get_all=False) if episode_attr.get('category') != 'movies' else {}), }