diff --git a/modeling/inference_models/generic_hf_torch/class.py b/modeling/inference_models/generic_hf_torch/class.py index 1cc1a373..25d49214 100644 --- a/modeling/inference_models/generic_hf_torch/class.py +++ b/modeling/inference_models/generic_hf_torch/class.py @@ -81,7 +81,6 @@ class model_backend(HFTorchInferenceModel): tf_kwargs = { "low_cpu_mem_usage": True, - "pretraining_tp": 1, } if self.quantization == "8bit":