Spaces:
Runtime error
Runtime error
try
Browse files
app.py
CHANGED
@@ -9,12 +9,12 @@ For more information on `huggingface_hub` Inference API support, please check th
 # client = InferenceClient("EITD/lora_model", token=os.getenv("HF_TOKEN"))
 
 model_name = "EITD/lora_model"
-
+bnb_config = BitsAndBytesConfig(
 load_in_4bit=True
 )
 model = AutoPeftModelForCausalLM.from_pretrained(
 model_name,
-quantization_config=
+quantization_config=bnb_config
 )
 tokenizer = AutoTokenizer.from_pretrained(model_name)
 