mirror of
https://github.com/KoboldAI/KoboldAI-Client.git
synced 2025-06-05 21:59:24 +02:00
Changed alt_multi_gen to experimental and UI2 only
This commit is contained in:
10
aiserver.py
10
aiserver.py
@@ -2306,7 +2306,7 @@ def patch_transformers():
|
||||
option = koboldai_vars.actions.actions[koboldai_vars.actions.action_count+1]['Options'][x]
|
||||
if option['Pinned'] or option["Previous Selection"] or option["Edited"]:
|
||||
option_offset = x+1
|
||||
batch_offset = int((koboldai_vars.generated_tkns-1) / koboldai_vars.genamt) if koboldai_vars.alt_multi_gen else 0
|
||||
batch_offset = int((koboldai_vars.generated_tkns-1) / koboldai_vars.genamt) if koboldai_vars.alt_multi_gen and koboldai_vars.experimental_features else 0
|
||||
for batch_index, batch in enumerate(scores):
|
||||
probs = F.softmax(batch, dim = -1).cpu().numpy()
|
||||
|
||||
@@ -2489,7 +2489,7 @@ def patch_transformers():
|
||||
self.halt = not koboldai_vars.lua_koboldbridge.generating
|
||||
koboldai_vars.lua_koboldbridge.regeneration_required = False
|
||||
|
||||
for i in range(koboldai_vars.numseqs) if not koboldai_vars.alt_multi_gen else range(1):
|
||||
for i in range(koboldai_vars.numseqs) if not (koboldai_vars.alt_multi_gen and koboldai_vars.experimental_features) else range(1):
|
||||
koboldai_vars.lua_koboldbridge.generated[i+1][koboldai_vars.generated_tkns] = int(input_ids[i, -1].item())
|
||||
|
||||
return self.regeneration_required or self.halt
|
||||
@@ -5400,7 +5400,7 @@ def core_generate(text: list, _min: int, _max: int, found_entries: set, is_core:
|
||||
numseqs = koboldai_vars.numseqs
|
||||
total_gens = None
|
||||
|
||||
for i in range(koboldai_vars.numseqs if koboldai_vars.alt_multi_gen else 1):
|
||||
for i in range(koboldai_vars.numseqs if koboldai_vars.alt_multi_gen and koboldai_vars.experimental_features else 1):
|
||||
while True:
|
||||
# The reason this is a loop is due to how Dynamic WI works. We
|
||||
# cannot simply add the WI to the context mid-generation, so we
|
||||
@@ -5413,7 +5413,7 @@ def core_generate(text: list, _min: int, _max: int, found_entries: set, is_core:
|
||||
max_new=koboldai_vars.genamt,
|
||||
do_streaming=koboldai_vars.output_streaming,
|
||||
do_dynamic_wi=koboldai_vars.dynamicscan,
|
||||
batch_count=numseqs if not koboldai_vars.alt_multi_gen else 1,
|
||||
batch_count=numseqs if not (koboldai_vars.alt_multi_gen and koboldai_vars.experimental_features) else 1,
|
||||
# Real max length is handled by CoreStopper.
|
||||
bypass_hf_maxlength=koboldai_vars.dynamicscan,
|
||||
is_core=True,
|
||||
@@ -5425,7 +5425,7 @@ def core_generate(text: list, _min: int, _max: int, found_entries: set, is_core:
|
||||
already_generated += len(genout[0])
|
||||
|
||||
try:
|
||||
assert already_generated <= koboldai_vars.genamt * koboldai_vars.numseqs if koboldai_vars.alt_multi_gen else 1
|
||||
assert already_generated <= koboldai_vars.genamt * koboldai_vars.numseqs if koboldai_vars.alt_multi_gen and koboldai_vars.experimental_features else 1
|
||||
except AssertionError:
|
||||
print("AlreadyGenerated", already_generated)
|
||||
print("genamt", koboldai_vars.genamt)
|
||||
|
Reference in New Issue
Block a user