mirror of
https://github.com/KoboldAI/KoboldAI-Client.git
synced 2025-02-27 08:57:46 +01:00
breakmodel fix for models without lm_head
This commit is contained in:
parent
8bfcf86a8b
commit
e00d9c4362
@ -383,9 +383,10 @@ if(not vars.model in ["InferKit", "Colab", "OAI", "ReadOnly"]):
|
|||||||
breakmodel.total_blocks = n_layers
|
breakmodel.total_blocks = n_layers
|
||||||
model.half().to('cpu')
|
model.half().to('cpu')
|
||||||
gc.collect()
|
gc.collect()
|
||||||
model.lm_head.to(breakmodel.gpu_device)
|
|
||||||
model.transformer.wte.to(breakmodel.gpu_device)
|
model.transformer.wte.to(breakmodel.gpu_device)
|
||||||
model.transformer.ln_f.to(breakmodel.gpu_device)
|
model.transformer.ln_f.to(breakmodel.gpu_device)
|
||||||
|
if(hasattr(model, 'lm_head')):
|
||||||
|
model.lm_head.to(breakmodel.gpu_device)
|
||||||
if(not hasattr(model.config, 'rotary') or not model.config.rotary):
|
if(not hasattr(model.config, 'rotary') or not model.config.rotary):
|
||||||
model.transformer.wpe.to(breakmodel.gpu_device)
|
model.transformer.wpe.to(breakmodel.gpu_device)
|
||||||
gc.collect()
|
gc.collect()
|
||||||
@ -433,9 +434,10 @@ if(not vars.model in ["InferKit", "Colab", "OAI", "ReadOnly"]):
|
|||||||
breakmodel.total_blocks = n_layers
|
breakmodel.total_blocks = n_layers
|
||||||
model.half().to('cpu')
|
model.half().to('cpu')
|
||||||
gc.collect()
|
gc.collect()
|
||||||
model.lm_head.to(breakmodel.gpu_device)
|
|
||||||
model.transformer.wte.to(breakmodel.gpu_device)
|
model.transformer.wte.to(breakmodel.gpu_device)
|
||||||
model.transformer.ln_f.to(breakmodel.gpu_device)
|
model.transformer.ln_f.to(breakmodel.gpu_device)
|
||||||
|
if(hasattr(model, 'lm_head')):
|
||||||
|
model.lm_head.to(breakmodel.gpu_device)
|
||||||
if(not hasattr(model.config, 'rotary') or not model.config.rotary):
|
if(not hasattr(model.config, 'rotary') or not model.config.rotary):
|
||||||
model.transformer.wpe.to(breakmodel.gpu_device)
|
model.transformer.wpe.to(breakmodel.gpu_device)
|
||||||
gc.collect()
|
gc.collect()
|
||||||
|
Loading…
x
Reference in New Issue
Block a user