Spaces:
Paused
Paused
Upload 2 files
Browse files
- app.py +1 -3
- requirements.txt +0 -2
app.py
CHANGED
|
@@ -15,7 +15,6 @@ torch.set_float32_matmul_precision("high")
|
|
| 15 |
HF_TOKEN = os.getenv("HF_TOKEN", None)
|
| 16 |
#REPO_ID = "deepseek-ai/DeepSeek-R1-Distill-Llama-8B"
|
| 17 |
REPO_ID = "nicoboss/DeepSeek-R1-Distill-Qwen-32B-Uncensored"
|
| 18 |
-
#REPO_ID = "Qwen/QwQ-32B"
|
| 19 |
|
| 20 |
DESCRIPTION = f'''
|
| 21 |
<div>
|
|
@@ -71,8 +70,7 @@ def chat(message: str,
|
|
| 71 |
messages.append({"role": "system", "content": sys_prompt})
|
| 72 |
messages.append({"role": "user", "content": message})
|
| 73 |
|
| 74 |
-
|
| 75 |
-
input_tensors = tokenizer.apply_chat_template(messages, add_generation_prompt=True, return_dict=True, return_tensors="pt").to(model.device)
|
| 76 |
|
| 77 |
input_ids = input_tensors["input_ids"]
|
| 78 |
attention_mask = input_tensors["attention_mask"]
|
|
|
|
| 15 |
HF_TOKEN = os.getenv("HF_TOKEN", None)
|
| 16 |
#REPO_ID = "deepseek-ai/DeepSeek-R1-Distill-Llama-8B"
|
| 17 |
REPO_ID = "nicoboss/DeepSeek-R1-Distill-Qwen-32B-Uncensored"
|
|
|
|
| 18 |
|
| 19 |
DESCRIPTION = f'''
|
| 20 |
<div>
|
|
|
|
| 70 |
messages.append({"role": "system", "content": sys_prompt})
|
| 71 |
messages.append({"role": "user", "content": message})
|
| 72 |
|
| 73 |
+
input_tensors = tokenizer.apply_chat_template([{"role": x["role"], "content": x["content"]} for x in history] + messages, add_generation_prompt=True, return_dict=True, add_special_tokens=False, return_tensors="pt").to(model.device)
|
|
|
|
| 74 |
|
| 75 |
input_ids = input_tensors["input_ids"]
|
| 76 |
attention_mask = input_tensors["attention_mask"]
|
requirements.txt
CHANGED
|
@@ -6,6 +6,4 @@ git+https://github.com/huggingface/transformers
|
|
| 6 |
numpy<2
|
| 7 |
sentencepiece
|
| 8 |
triton
|
| 9 |
-
optimum
|
| 10 |
-
optimum-quanto
|
| 11 |
bitsandbytes
|
|
|
|
| 6 |
numpy<2
|
| 7 |
sentencepiece
|
| 8 |
triton
|
|
|
|
|
|
|
| 9 |
bitsandbytes
|