EITD committed on
Commit
43f9110
·
1 Parent(s): fcb5285
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -9,12 +9,12 @@ For more information on `huggingface_hub` Inference API support, please check th
9
  # client = InferenceClient("EITD/lora_model", token=os.getenv("HF_TOKEN"))
10
 
11
  model_name = "EITD/lora_model"
12
- quantization_config = BitsAndBytesConfig(
13
  load_in_4bit=True
14
  )
15
  model = AutoPeftModelForCausalLM.from_pretrained(
16
  model_name,
17
- quantization_config=quantization_config
18
  )
19
  tokenizer = AutoTokenizer.from_pretrained(model_name)
20
 
 
9
  # client = InferenceClient("EITD/lora_model", token=os.getenv("HF_TOKEN"))
10
 
11
  model_name = "EITD/lora_model"
12
+ bnb_config = BitsAndBytesConfig(
13
  load_in_4bit=True
14
  )
15
  model = AutoPeftModelForCausalLM.from_pretrained(
16
  model_name,
17
+ quantization_config=bnb_config
18
  )
19
  tokenizer = AutoTokenizer.from_pretrained(model_name)
20