tmberooney committed on
Commit
30b869f
·
1 Parent(s): 8079dc4

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -22,7 +22,7 @@ from peft import PeftModel, PeftConfig
22
  from transformers import AutoModelForCausalLM, AutoTokenizer
23
 
24
  config = PeftConfig.from_pretrained("tmberooney/medstralchatbotgptq")
25
- model = AutoModelForCausalLM.from_pretrained("TheBloke/Mistral-7B-Instruct-v0.2-DARE-GPTQ")
26
  model = PeftModel.from_pretrained(model, "tmberooney/medstralchatbotgptq")
27
  tokenizer=AutoTokenizer.from_pretrained(config.base_model_name_or_path)
28
  device_map = {"transformer.word_embeddings": "cpu",
 
22
  from transformers import AutoModelForCausalLM, AutoTokenizer
23
 
24
  config = PeftConfig.from_pretrained("tmberooney/medstralchatbotgptq")
25
+ model = AutoModelForCausalLM.from_pretrained("TheBloke/Mistral-7B-Instruct-v0.2-DARE-GPTQ",load_in_4bit=True, torch_dtype=torch.float16, llm_int8_enable_fp32_cpu_offload=True)
26
  model = PeftModel.from_pretrained(model, "tmberooney/medstralchatbotgptq")
27
  tokenizer=AutoTokenizer.from_pretrained(config.base_model_name_or_path)
28
  device_map = {"transformer.word_embeddings": "cpu",