Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -45,7 +45,8 @@ def generate_with_llama_chat(my_config):
|
|
45 |
repetition_penalty=repetition_penalty,
|
46 |
#max_length=2000,
|
47 |
max_new_tokens=max_new_tokens,
|
48 |
-
model_kwargs={"device_map": "auto","load_in_8bit": True}
|
|
|
49 |
end_time = time.time()
|
50 |
elapsed_time = end_time - start_time
|
51 |
print(f"Loading the model: {elapsed_time} seconds")
|
|
|
45 |
repetition_penalty=repetition_penalty,
|
46 |
#max_length=2000,
|
47 |
max_new_tokens=max_new_tokens,
|
48 |
+
#model_kwargs={"device_map": "auto","load_in_8bit": True}
|
49 |
+
) #, "src_lang": "en", "tgt_lang": "nl"}) does not work!
|
50 |
end_time = time.time()
|
51 |
elapsed_time = end_time - start_time
|
52 |
print(f"Loading the model: {elapsed_time} seconds")
|