mirror of
https://github.com/KoboldAI/KoboldAI-Client.git
synced 2025-06-05 21:59:24 +02:00
Not quite
This commit is contained in:
@@ -289,7 +289,8 @@ class HFTorchInferenceModel(HFInferenceModel):
|
||||
device_map = infer_auto_device_map(
|
||||
model,
|
||||
max_memory={0: "10GiB", 1: "7GiB", "cpu": "15GiB"},
|
||||
no_split_module_classes=["GPTJBlock"],
|
||||
no_split_module_classes=["GPTJBlock", "OPTDecoderLayer"],
|
||||
dtype="float16",
|
||||
)
|
||||
|
||||
return AutoModelForCausalLM.from_pretrained(
|
||||
|
Reference in New Issue
Block a user