Merge pull request #180 from VE-FORBRYDERNE/patch

Only enable TPU transpose optimization if loading from HF model
2025-06-05 21:59:24 +02:00 · 2022-11-21 20:02:14 +01:00
parent f2077b8e58 9a3f0eaab2
commit 04d9172fcd
1 changed file with 2 additions and 1 deletion
--- a/tpu_mtj_backend.py
+++ b/tpu_mtj_backend.py
@@ -1149,6 +1149,7 @@ def load_model(path: str, driver_version="tpu_driver0.1_dev20210607", hf_checkpo
            params[param] = default_params[param]
    # Use an optimization that will allow us to avoid one extra transpose operation
    if hf_checkpoint:
        params["transposed_linear"] = True
    # Load tokenizer