EITD committed on
Commit
5acd05f
·
1 Parent(s): f7837ea
Files changed (1) hide show
  1. app.py +1 -4
app.py CHANGED
@@ -9,12 +9,9 @@ For more information on `huggingface_hub` Inference API support, please check th
9
  # client = InferenceClient("EITD/lora_model", token=os.getenv("HF_TOKEN"))
10
 
11
  model_name = "EITD/lora_model"
12
- quantization_config = BitsAndBytesConfig(
13
- load_in_4bit=True
14
- )
15
  model = AutoPeftModelForCausalLM.from_pretrained(
16
  model_name,
17
- quantization_config=quantization_config
18
  )
19
  tokenizer = AutoTokenizer.from_pretrained(model_name)
20
 
 
9
  # client = InferenceClient("EITD/lora_model", token=os.getenv("HF_TOKEN"))
10
 
11
  model_name = "EITD/lora_model"
 
 
 
12
  model = AutoPeftModelForCausalLM.from_pretrained(
13
  model_name,
14
+ load_in_4bit = True,
15
  )
16
  tokenizer = AutoTokenizer.from_pretrained(model_name)
17