mirror of
https://github.com/KoboldAI/KoboldAI-Client.git
synced 2025-06-05 21:59:24 +02:00
12
aiserver.py
12
aiserver.py
@@ -1716,10 +1716,11 @@ def patch_transformers():
|
|||||||
assert scores.ndim == 2
|
assert scores.ndim == 2
|
||||||
assert input_ids.ndim == 2
|
assert input_ids.ndim == 2
|
||||||
|
|
||||||
if koboldai_vars.numseqs > 1 or not koboldai_vars.show_probs:
|
if not koboldai_vars.show_probs:
|
||||||
return scores
|
return scores
|
||||||
|
|
||||||
probs = F.softmax(scores, dim = -1).cpu().numpy()[0]
|
for batch_index, batch in enumerate(scores):
|
||||||
|
probs = F.softmax(batch, dim = -1).cpu().numpy()
|
||||||
|
|
||||||
token_prob_info = []
|
token_prob_info = []
|
||||||
for token_id, score in sorted(enumerate(probs), key=lambda x: x[1], reverse=True)[:8]:
|
for token_id, score in sorted(enumerate(probs), key=lambda x: x[1], reverse=True)[:8]:
|
||||||
@@ -1729,7 +1730,12 @@ def patch_transformers():
|
|||||||
"score": float(score),
|
"score": float(score),
|
||||||
})
|
})
|
||||||
|
|
||||||
#koboldai_vars.token_stream_queue.probability_buffer = token_prob_info
|
|
||||||
|
if len(scores) == 1:
|
||||||
|
koboldai_vars.actions.set_probabilities(token_prob_info)
|
||||||
|
else:
|
||||||
|
koboldai_vars.actions.set_option_probabilities(token_prob_info, batch_index)
|
||||||
|
|
||||||
return scores
|
return scores
|
||||||
|
|
||||||
def new_get_logits_processor(*args, **kwargs) -> LogitsProcessorList:
|
def new_get_logits_processor(*args, **kwargs) -> LogitsProcessorList:
|
||||||
|
Reference in New Issue
Block a user