yt-dlp/yt_dlp/extractor/dtube.py

import json
import socket

from .common import InfoExtractor
from ..utils import (
    int_or_none,
    parse_iso8601,
)


class DTubeIE(InfoExtractor):
    """Extractor for d.tube video pages of the form ``/v/<uploader_id>/<id>``.

    Post metadata is requested from https://api.steemit.com/ using the
    ``get_content`` JSON-RPC method; media and thumbnail URLs are built by
    appending the hashes found in that metadata to
    ``https://video.dtube.top/ipfs/``.
    """

    # Flagged as non-working; how the flag is honoured is decided by the
    # InfoExtractor base class, which is not visible in this file.
    _WORKING = False
    _VALID_URL = r'https?://(?:www\.)?d\.tube/(?:#!/)?v/(?P<uploader_id>[0-9a-z.-]+)/(?P<id>[0-9a-z]{8})'
    _TEST = {
        'url': 'https://d.tube/#!/v/broncnutz/x380jtr1',
        'md5': '9f29088fa08d699a7565ee983f56a06e',
        'info_dict': {
            'id': 'x380jtr1',
            'ext': 'mp4',
            'title': 'Lefty 3-Rings is Back Baby!! NCAA Picks',
            'description': 'md5:60be222088183be3a42f196f34235776',
            'uploader_id': 'broncnutz',
            'upload_date': '20190107',
            'timestamp': 1546854054,
        },
        'params': {
            'format': '480p',
        },
    }

    def _real_extract(self, url):
        """Return the info dict for the video addressed by *url*.

        Every candidate format URL is probed with a 5 second timeout; a
        format whose probe times out is reported on screen and left out of
        the result.

        Raises:
            KeyError: if the API response lacks ``result``, ``json_metadata``,
                ``video`` or ``content``, or has no usable title.
            OSError: any probe failure that is not a timeout is re-raised
                unchanged.
        """
        uploader_id, video_id = self._match_valid_url(url).groups()
        result = self._download_json('https://api.steemit.com/', video_id, data=json.dumps({
            'jsonrpc': '2.0',
            'method': 'get_content',
            'params': [uploader_id, video_id],
        }).encode())['result']

        # `json_metadata` is itself a JSON document serialized into a string.
        metadata = json.loads(result['json_metadata'])
        video = metadata['video']
        content = video['content']
        # `or {}` instead of a `.get` default: an explicit JSON null for
        # `info` would otherwise make the `.get` calls below fail.
        info = video.get('info') or {}
        title = info.get('title') or result['title']

        def canonical_url(h):
            # Missing/empty hashes map to None so callers can skip them.
            if not h:
                return None
            return 'https://video.dtube.top/ipfs/' + h

        formats = []
        # The empty suffix selects the plain `videohash` key, which is
        # reported as the 'Source' format.
        for q in ('240', '480', '720', '1080', ''):
            video_url = canonical_url(content.get(f'video{q}hash'))
            if not video_url:
                continue
            format_id = (q + 'p') if q else 'Source'
            self.to_screen(f'{video_id}: Checking {format_id} video format URL')
            try:
                self._downloader._opener.open(video_url, timeout=5).close()
            except OSError as err:
                # urllib raises a timeout that occurs while reading the
                # response as a bare socket.timeout, but wraps one that occurs
                # while connecting/sending in URLError (an OSError subclass)
                # and stores the original exception in `.reason`. Treat both
                # as "format unavailable"; anything else is a real failure.
                timed_out = (
                    isinstance(err, socket.timeout)
                    or isinstance(getattr(err, 'reason', None), socket.timeout))
                if not timed_out:
                    raise
                self.to_screen(
                    f'{video_id}: {format_id} URL is invalid, skipping')
                continue
            formats.append({
                'format_id': format_id,
                'url': video_url,
                'height': int_or_none(q),
                'ext': 'mp4',
            })

        return {
            'id': video_id,
            'title': title,
            'description': content.get('description'),
            'thumbnail': canonical_url(info.get('snaphash')),
            'tags': content.get('tags') or metadata.get('tags'),
            'duration': info.get('duration'),
            'formats': formats,
            'timestamp': parse_iso8601(result.get('created')),
            'uploader_id': uploader_id,
        }
[dtube] Add new extractor(closes #15201) 2018-05-16 09:08:44 +02:00			`import json`
[ie, cleanup] No `from` stdlib imports in extractors (#8978) 2024-04-01 02:01:09 +02:00			`import socket`
[dtube] Add new extractor(closes #15201) 2018-05-16 09:08:44 +02:00
			`from .common import InfoExtractor`
			`from ..utils import (`
			`int_or_none,`
			`parse_iso8601,`
			`)`


			`class DTubeIE(InfoExtractor):`
[cleanup] Mark broken and remove dead extractors (#9238) Authored by: seproDev 2024-03-09 01:02:45 +01:00			`_WORKING = False`
[dtube] Add new extractor(closes #15201) 2018-05-16 09:08:44 +02:00			`_VALID_URL = r'https?://(?:www\.)?d\.tube/(?:#!/)?v/(?P<uploader_id>[0-9a-z.-]+)/(?P<id>[0-9a-z]{8})'`
			`_TEST = {`
[dtube] Update test 2019-01-08 02:46:34 +01:00			`'url': 'https://d.tube/#!/v/broncnutz/x380jtr1',`
			`'md5': '9f29088fa08d699a7565ee983f56a06e',`
[dtube] Add new extractor(closes #15201) 2018-05-16 09:08:44 +02:00			`'info_dict': {`
[dtube] Update test 2019-01-08 02:46:34 +01:00			`'id': 'x380jtr1',`
[dtube] Add new extractor(closes #15201) 2018-05-16 09:08:44 +02:00			`'ext': 'mp4',`
[dtube] Update test 2019-01-08 02:46:34 +01:00			`'title': 'Lefty 3-Rings is Back Baby!! NCAA Picks',`
			`'description': 'md5:60be222088183be3a42f196f34235776',`
			`'uploader_id': 'broncnutz',`
			`'upload_date': '20190107',`
			`'timestamp': 1546854054,`
[dtube] Add new extractor(closes #15201) 2018-05-16 09:08:44 +02:00			`},`
			`'params': {`
			`'format': '480p',`
			`},`
			`}`

			`def _real_extract(self, url):`
[extractor] Common function `_match_valid_url` 2021-08-19 03:41:24 +02:00			`uploader_id, video_id = self._match_valid_url(url).groups()`
[dtube] Add new extractor(closes #15201) 2018-05-16 09:08:44 +02:00			`result = self._download_json('https://api.steemit.com/', video_id, data=json.dumps({`
			`'jsonrpc': '2.0',`
			`'method': 'get_content',`
			`'params': [uploader_id, video_id],`
			`}).encode())['result']`

			`metadata = json.loads(result['json_metadata'])`
			`video = metadata['video']`
			`content = video['content']`
			`info = video.get('info', {})`
			`title = info.get('title') or result['title']`

			`def canonical_url(h):`
			`if not h:`
			`return None`
[dtube] Fix extraction (closes #18741) 2019-01-08 02:44:42 +01:00			`return 'https://video.dtube.top/ipfs/' + h`
[dtube] Add new extractor(closes #15201) 2018-05-16 09:08:44 +02:00
			`formats = []`
			`for q in ('240', '480', '720', '1080', ''):`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-12 01:09:58 +02:00			`video_url = canonical_url(content.get(f'video{q}hash'))`
[dtube] Add new extractor(closes #15201) 2018-05-16 09:08:44 +02:00			`if not video_url:`
			`continue`
			`format_id = (q + 'p') if q else 'Source'`
			`try:`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-12 01:09:58 +02:00			`self.to_screen(f'{video_id}: Checking {format_id} video format URL')`
[dtube] Add new extractor(closes #15201) 2018-05-16 09:08:44 +02:00			`self._downloader._opener.open(video_url, timeout=5).close()`
[ie, cleanup] No `from` stdlib imports in extractors (#8978) 2024-04-01 02:01:09 +02:00			`except socket.timeout:`
[dtube] Add new extractor(closes #15201) 2018-05-16 09:08:44 +02:00			`self.to_screen(`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-12 01:09:58 +02:00			`f'{video_id}: {format_id} URL is invalid, skipping')`
[dtube] Add new extractor(closes #15201) 2018-05-16 09:08:44 +02:00			`continue`
			`formats.append({`
			`'format_id': format_id,`
			`'url': video_url,`
			`'height': int_or_none(q),`
			`'ext': 'mp4',`
			`})`

			`return {`
			`'id': video_id,`
			`'title': title,`
			`'description': content.get('description'),`
			`'thumbnail': canonical_url(info.get('snaphash')),`
			`'tags': content.get('tags') or metadata.get('tags'),`
			`'duration': info.get('duration'),`
			`'formats': formats,`
			`'timestamp': parse_iso8601(result.get('created')),`
			`'uploader_id': uploader_id,`
			`}`