Remove comment extraction code for now

Comment extraction can be added back in a separate PR
2025-06-06 00:49:20 +02:00 · 2024-11-11 21:14:56 +01:00
parent 727c762311
commit 19508dd192
2 changed files with 0 additions and 45 deletions
--- a/README.md
+++ b/README.md
@@ -1864,11 +1864,6 @@ The following extractors use this feature:
 #### digitalconcerthall
 * `prefer_combined_hls`: Prefer extracting combined/pre-merged video and audio HLS formats. This will exclude 4K/HEVC video and lossless/FLAC audio formats, which are only available as split video/audio HLS formats

-#### mixchmovie
-
-* `max_comments`: Maximum number of comments to extract - default is `120`. The final amount of comments is less than the limit because gifts are filtered.
-* `fetch_interval_sec`: Comment json files fetching interval. If `max_comments` is set too large, fetch interval need to be limit
-
 **Note**: These options may be changed/removed in the future without concern for backward compatibility

 <!-- MANPAGE: MOVE "INSTALLATION" SECTION HERE -->
--- a/yt_dlp/extractor/mixch.py
+++ b/yt_dlp/extractor/mixch.py
@@ -3,7 +3,6 @@ from ..networking.exceptions import HTTPError
 from ..utils import (
    ExtractorError,
    UserNotLive,
-    bool_or_none,
    int_or_none,
    str_or_none,
    url_or_none,
@@ -169,43 +168,4 @@ class MixchMovieIE(InfoExtractor):
                'uploader_url': ('ownerInfo', 'id', {lambda x: x and f'https://mixch.tv/u/{x}'}),
            }),
            'live_status': 'not_live',
-            '__post_extractor': self.extract_comments(video_id),
        }
-
-    def _get_comments(self, video_id):
-        # Comments are organized in a json chain, connected with 'nextCursor' property.
-        # There are up to 20 comments in one json file.
-        COMMENTS_LIMIT = 20
-        # If json files are downloaded too frequently, the server might ban all the access from your IP.
-        comments_left = int_or_none(self._configuration_arg('max_comments', [''])[0]) or 120
-        fetch_interval_sec = int_or_none(self._configuration_arg('fetch_interval_sec', [''])[0])
-
-        base_url = f'https://mixch.tv/api-web/movies/{video_id}/comments'
-        has_next = True
-        next_cursor = ''
-        fragment = 1
-
-        while has_next and (comments_left > 0):
-            data = self._download_json(
-                base_url, video_id,
-                note=f'Downloading comments, fragment {fragment}', errnote='Failed to download comments',
-                query={'cursor': next_cursor, 'limit': COMMENTS_LIMIT})
-            fragment += 1
-            comments_left -= COMMENTS_LIMIT
-
-            # Some of the 'comments' are not real comments but gifts.
-            # Only real comments are extracted here.
-            yield from traverse_obj(data, ('comments', lambda _, v: v['comment'], {
-                'author': ('user_name', {str}),
-                'author_id': ('user_id', {int_or_none}),
-                'author_thumbnail': ('profile_image_url', {url_or_none}),
-                'id': ('id', {int_or_none}),
-                'text': ('comment', {str_or_none}),
-                'timestamp': ('created', {int_or_none}),
-            }))
-
-            if fetch_interval_sec:
-                self._sleep(fetch_interval_sec, video_id)
-
-            has_next = traverse_obj(data, ('hasNext'), {bool_or_none})
-            next_cursor = traverse_obj(data, ('nextCursor'), {str_or_none})