Merge pull request #367 from 0cc4m/4bit-plugin

GPTQ module
This commit is contained in:
henk717
2023-07-23 22:32:20 +02:00
committed by GitHub
10 changed files with 344 additions and 8 deletions

View File

@@ -17,9 +17,12 @@ from transformers import (
     StoppingCriteria,
     GPTNeoForCausalLM,
     GPT2LMHeadModel,
-    AutoModelForCausalLM,
     LogitsProcessorList,
 )
+try:
+    from hf_bleeding_edge import AutoModelForCausalLM
+except ImportError:
+    from transformers import AutoModelForCausalLM
 import utils
 import modeling.lazy_loader as lazy_loader