This commit is contained in:
Henk
2023-07-22 15:25:14 +02:00
parent 7823da564e
commit fa9d17b3d3
4 changed files with 4 additions and 3 deletions

View File

@@ -81,6 +81,7 @@ class model_backend(HFTorchInferenceModel):
tf_kwargs = {
"low_cpu_mem_usage": True,
"pretraining_tp": 1,
}
if self.quantization == "8bit":