mirror of
https://github.com/KoboldAI/KoboldAI-Client.git
synced 2025-01-10 07:20:04 +01:00
Only enable TPU transpose optimization if loading from HF model
This commit is contained in:
parent
f2077b8e58
commit
9a3f0eaab2
@ -1149,7 +1149,8 @@ def load_model(path: str, driver_version="tpu_driver0.1_dev20210607", hf_checkpo
|
||||
params[param] = default_params[param]
|
||||
|
||||
# Use an optimization that will allow us to avoid one extra transpose operation
|
||||
params["transposed_linear"] = True
|
||||
if hf_checkpoint:
|
||||
params["transposed_linear"] = True
|
||||
|
||||
# Load tokenizer
|
||||
if vars.model == "TPUMeshTransformerGPTNeoX":
|
||||
|
Loading…
Reference in New Issue
Block a user