Merge commit 'refs/pull/352/head' of https://github.com/ebolam/KoboldAI into UI2

2025-06-05 21:59:24 +02:00 · 2022-12-20 21:24:06 -05:00
parent 4b53126d29 2a949cbe2a
commit 1500d07c38
6 changed files with 43 additions and 33 deletions
--- a/aiserver.py
+++ b/aiserver.py
@@ -2291,13 +2291,11 @@ def patch_transformers():

    from torch.nn import functional as F

-    class ProbabilityVisualizerLogitsProcessor(LogitsProcessor):
-        def __init__(self):
-            pass
+    def visualize_probabilities(scores: torch.FloatTensor) -> None:
+        assert scores.ndim == 2

-        def __call__(self, input_ids: torch.LongTensor, scores: torch.FloatTensor) -> torch.FloatTensor:
-            assert scores.ndim == 2
-            assert input_ids.ndim == 2
+        if vars.numseqs > 1 or not vars.show_probs:
+            return

            if not koboldai_vars.show_probs:
                return scores
@@ -2332,7 +2330,6 @@ def patch_transformers():
        processors = new_get_logits_processor.old_get_logits_processor(*args, **kwargs)
        processors.insert(0, LuaLogitsProcessor())
        processors.append(PhraseBiasLogitsProcessor())
-        processors.append(ProbabilityVisualizerLogitsProcessor())
        return processors
    use_core_manipulations.get_logits_processor =  new_get_logits_processor
    new_get_logits_processor.old_get_logits_processor = transformers.generation_utils.GenerationMixin._get_logits_processor
@@ -2354,6 +2351,7 @@ def patch_transformers():
                sampler_order = [6] + sampler_order
            for k in sampler_order:
                scores = self.__warper_list[k](input_ids, scores, *args, **kwargs)
+            visualize_probabilities(scores)
            return scores

    def new_get_logits_warper(beams: int = 1,) -> LogitsProcessorList:
@@ -2889,6 +2887,7 @@ def load_model(use_gpu=True, gpu_layers=None, disk_layers=None, initial_load=Fal
                    with zipfile.ZipFile(f, "r") as z:
                        try:
                            last_storage_key = None
+                            zipfolder = os.path.basename(os.path.normpath(f)).split('.')[0]
                            f = None
                            current_offset = 0
                            able_to_pin_layers = True
@@ -2900,7 +2899,10 @@ def load_model(use_gpu=True, gpu_layers=None, disk_layers=None, initial_load=Fal
                                    last_storage_key = storage_key
                                    if isinstance(f, zipfile.ZipExtFile):
                                        f.close()
-                                    f = z.open(f"archive/data/{storage_key}")
+                                    try:
+                                        f = z.open(f"archive/data/{storage_key}")
+                                    except:
+                                        f = z.open(f"{zipfolder}/data/{storage_key}")
                                    current_offset = 0
                                if current_offset != model_dict[key].seek_offset:
                                    f.read(model_dict[key].seek_offset - current_offset)