mirror of
https://github.com/KoboldAI/KoboldAI-Client.git
synced 2025-06-05 21:59:24 +02:00
Model: And another refactor
This commit is contained in:
27
modeling/post_token_hooks.py
Normal file
27
modeling/post_token_hooks.py
Normal file
@@ -0,0 +1,27 @@
|
||||
import torch
|
||||
|
||||
import utils
|
||||
from modeling.inference_model import InferenceModel
|
||||
|
||||
|
||||
class PostTokenHooks:
    """Callbacks run after each token is generated during sampling."""

    @staticmethod
    def stream_tokens(
        model: InferenceModel,
        input_ids: torch.LongTensor,
    ) -> None:
        """Send the most recent decoded token of each sequence to the token stream.

        Does nothing unless streaming is enabled both in the model's
        generation state and in the global `output_streaming` setting.

        Args:
            model: The inference model whose tokenizer and gen_state are used.
            input_ids: Generated token ids so far; the last id of each row
                is decoded and streamed.
        """
        # Guard clauses: skip entirely when streaming is turned off,
        # either for this generation or globally.
        if not model.gen_state["do_streaming"]:
            return
        if not utils.koboldai_vars.output_streaming:
            return

        # Decode and format only the newest token of every sequence.
        formatted = []
        for sequence in input_ids:
            token_text = utils.decodenewlines(model.tokenizer.decode(sequence[-1]))
            formatted.append(
                utils.applyoutputformatting(
                    token_text,
                    no_sentence_trimming=True,
                    no_single_line=True,
                )
            )
        utils.koboldai_vars.actions.stream_tokens(formatted)
|
Reference in New Issue
Block a user