Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -2,10 +2,10 @@ import gradio as gr
|
|
2 |
from transformers import AutoTokenizer, AutoModelForCausalLM
|
3 |
|
4 |
# Load model and tokenizer
|
5 |
-
model_name = "
|
6 |
|
7 |
-
tokenizer = AutoTokenizer.from_pretrained(model_name
|
8 |
-
model = AutoModelForCausalLM.from_pretrained(model_name
|
9 |
|
10 |
# Chat function
|
11 |
def chatbot(user_message, history):
|
@@ -20,7 +20,10 @@ def chatbot(user_message, history):
|
|
20 |
).to(model.device)
|
21 |
|
22 |
outputs = model.generate(**inputs, max_new_tokens=200)
|
23 |
-
response = tokenizer.decode(
|
|
|
|
|
|
|
24 |
|
25 |
history.append({"role": "user", "content": user_message})
|
26 |
history.append({"role": "assistant", "content": response})
|
@@ -29,7 +32,7 @@ def chatbot(user_message, history):
|
|
29 |
|
30 |
# Gradio UI
|
31 |
with gr.Blocks() as demo:
|
32 |
-
gr.Markdown("# 🤖
|
33 |
|
34 |
chatbot_ui = gr.Chatbot()
|
35 |
msg = gr.Textbox(placeholder="Type your message here...")
|
|
|
2 |
from transformers import AutoTokenizer, AutoModelForCausalLM
|
3 |
|
4 |
# Load model and tokenizer
|
5 |
+
model_name = "ibm-granite/granite-4.0-tiny-preview"
|
6 |
|
7 |
+
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
8 |
+
model = AutoModelForCausalLM.from_pretrained(model_name)
|
9 |
|
10 |
# Chat function
|
11 |
def chatbot(user_message, history):
|
|
|
20 |
).to(model.device)
|
21 |
|
22 |
outputs = model.generate(**inputs, max_new_tokens=200)
|
23 |
+
response = tokenizer.decode(
|
24 |
+
outputs[0][inputs["input_ids"].shape[-1]:],
|
25 |
+
skip_special_tokens=True
|
26 |
+
)
|
27 |
|
28 |
history.append({"role": "user", "content": user_message})
|
29 |
history.append({"role": "assistant", "content": response})
|
|
|
32 |
|
33 |
# Gradio UI
|
34 |
with gr.Blocks() as demo:
|
35 |
+
gr.Markdown("# 🤖 Granite-4.0 Tiny Chatbot")
|
36 |
|
37 |
chatbot_ui = gr.Chatbot()
|
38 |
msg = gr.Textbox(placeholder="Type your message here...")
|