polpoDevs committed on
Commit
12b8ccb
·
verified ·
1 Parent(s): b49cf9a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -45,7 +45,8 @@ def generate_with_llama_chat(my_config):
45
  repetition_penalty=repetition_penalty,
46
  #max_length=2000,
47
  max_new_tokens=max_new_tokens,
48
- model_kwargs={"device_map": "auto","load_in_8bit": True}) #, "src_lang": "en", "tgt_lang": "nl"}) does not work!
 
49
  end_time = time.time()
50
  elapsed_time = end_time - start_time
51
  print(f"Loading the model: {elapsed_time} seconds")
 
45
  repetition_penalty=repetition_penalty,
46
  #max_length=2000,
47
  max_new_tokens=max_new_tokens,
48
+ #model_kwargs={"device_map": "auto","load_in_8bit": True}
49
+ ) #, "src_lang": "en", "tgt_lang": "nl"}) does not work!
50
  end_time = time.time()
51
  elapsed_time = end_time - start_time
52
  print(f"Loading the model: {elapsed_time} seconds")