Linseypass committed on
Commit
a33b5ff
·
1 Parent(s): c448b10

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -3
app.py CHANGED
@@ -11,12 +11,11 @@ import nltk
11
  nltk.download('punkt')
12
 
13
  # loads Guanaco 7B model - takes around 2-3 minutes - can do this separately
14
- model_name = "decapoda-research/llama-7b-hf"
15
  adapters_name = 'timdettmers/guanaco-7b'
16
  # print(f"Starting to load the model {model_name} into memory")
17
  m = AutoModelForCausalLM.from_pretrained(
18
- model_name,
19
- load_in_4bit=True)
20
  m = PeftModel.from_pretrained(m, adapters_name)
21
  #m = m.merge_and_unload()
22
  tok = LlamaTokenizer.from_pretrained(model_name)
 
11
  nltk.download('punkt')
12
 
13
  # loads Guanaco 7B model - takes around 2-3 minutes - can do this separately
14
+ model_name = "decapoda-research/llama-7b-hf-int4"
15
  adapters_name = 'timdettmers/guanaco-7b'
16
  # print(f"Starting to load the model {model_name} into memory")
17
  m = AutoModelForCausalLM.from_pretrained(
18
+ model_name)
 
19
  m = PeftModel.from_pretrained(m, adapters_name)
20
  #m = m.merge_and_unload()
21
  tok = LlamaTokenizer.from_pretrained(model_name)