Mirror of https://github.com/KoboldAI/KoboldAI-Client.git (synced 2025-06-05 21:59:24 +02:00)
increase API version (+1 squashed commits)

Squashed commits:
[c168c08] Added stop sequences functionality for API calls
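For context, the stop sequences added here are consumed during generation requests against the API. Below is a minimal client-side sketch of how the feature might be exercised; the endpoint path, port, and the stop_sequence field name are assumptions based on this commit message, not confirmed by the diff itself.

import requests

# Hypothetical client call: ask a local KoboldAI instance for a completion and
# request that generation halt once any of the listed stop sequences appears.
payload = {
    "prompt": "Once upon a time",
    "max_length": 80,
    "stop_sequence": ["\nYou:", "The End"],  # assumed field name for this feature
}
resp = requests.post("http://localhost:5000/api/v1/generate", json=payload)
resp.raise_for_status()
print(resp.json())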
@@ -116,6 +116,33 @@ class Stoppers:
            return True
        return False

    @staticmethod
    def stop_sequence_stopper(
        model: InferenceModel,
        input_ids: torch.LongTensor,
    ) -> bool:

        data = [model.tokenizer.decode(x) for x in input_ids]
        # null_character = model.tokenizer.encode(chr(0))[0]
        if "completed" not in model.gen_state:
            model.gen_state["completed"] = [False] * len(input_ids)

        # One issue is that the stop sequence may not actually align with the end
        # of a token if it is a subsection of a longer token.
        for stopper in utils.koboldai_vars.stop_sequence:
            for i in range(len(input_ids)):
                if data[i][-len(stopper):] == stopper:
                    model.gen_state["completed"][i] = True

        if all(model.gen_state["completed"]):
            utils.koboldai_vars.generated_tkns = utils.koboldai_vars.genamt
            del model.gen_state["completed"]
            return True
        return False

    @staticmethod
    def singleline_stopper(
        model: InferenceModel,
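The token-boundary comment in stop_sequence_stopper can be made concrete with a small, self-contained sketch (illustrative only, not repository code): the check compares the suffix of the decoded text against the stop sequence, so a stop sequence that ends up buried inside a longer final token, with extra characters after it, is not detected on that generation step.

# Illustrative sketch (assumed example) of the suffix check used above and the
# caveat from the comment: the stopper is only detected when the decoded text
# ends exactly with it, so characters merged into the final token after the
# stop sequence hide it for that step.
def ends_with_stopper(decoded_text: str, stopper: str) -> bool:
    return decoded_text[-len(stopper):] == stopper

print(ends_with_stopper("She whispered: The End", "The End"))   # True
print(ends_with_stopper("She whispered: The End.", "The End"))  # False, "." hides it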