mirror of
https://github.com/KoboldAI/KoboldAI-Client.git
synced 2025-06-05 21:59:24 +02:00
Merge pull request #180 from VE-FORBRYDERNE/patch
Only enable TPU transpose optimization if loading from HF model
This commit is contained in:
@@ -1149,6 +1149,7 @@ def load_model(path: str, driver_version="tpu_driver0.1_dev20210607", hf_checkpo
|
|||||||
params[param] = default_params[param]
|
params[param] = default_params[param]
|
||||||
|
|
||||||
# Use an optimization that will allow us to avoid one extra transpose operation
|
# Use an optimization that will allow us to avoid one extra transpose operation
|
||||||
|
if hf_checkpoint:
|
||||||
params["transposed_linear"] = True
|
params["transposed_linear"] = True
|
||||||
|
|
||||||
# Load tokenizer
|
# Load tokenizer
|
||||||
|
Reference in New Issue
Block a user