shanthi-323 commited on
Commit
d7eaedb
·
verified ·
1 Parent(s): f35ee3e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -13
app.py CHANGED
@@ -1,24 +1,22 @@
1
  import streamlit as st
2
- from transformers import AutoModelForCausalLM, AutoTokenizer
3
 
4
- # Load the model and tokenizer
5
  @st.cache_resource
6
  def load_model():
7
- model_name = "shanthi-323/lora_model_qnachatbot_cbt_q4_k_m"
8
- tokenizer = AutoTokenizer.from_pretrained(model_name)
9
- model = AutoModelForCausalLM.from_pretrained(model_name)
10
- return tokenizer, model
11
 
12
- tokenizer, model = load_model()
13
 
14
- st.title("AI Chatbot")
15
- st.write("Chat with your fine-tuned model!")
16
 
17
  # User input
18
  user_input = st.text_input("You: ", placeholder="Type your message here...")
19
 
20
  if user_input:
21
- inputs = tokenizer(user_input, return_tensors="pt")
22
- outputs = model.generate(inputs["input_ids"], max_length=100)
23
- response = tokenizer.decode(outputs[0], skip_special_tokens=True)
24
- st.text_area("Bot:", value=response, height=200, max_chars=None)
 
import streamlit as st
from llama_cpp import Llama

# Load the GGUF model once per session; st.cache_resource keeps the
# llama.cpp context (and its memory-mapped weights) alive across reruns.
@st.cache_resource
def load_model():
    """Load and cache the quantized GGUF model via llama-cpp-python."""
    # NOTE(review): Llama(model_path=...) expects a *local file path* to a
    # .gguf file, but this value looks like a Hugging Face repo id — confirm
    # the file actually exists at this path in the Space, or switch to
    # Llama.from_pretrained(repo_id=..., filename="*.gguf").
    model_path = "shanthi-323/lora_model_qnachatbot_cbt_q4_k_m"  # Ensure this path matches your uploaded GGUF model file
    return Llama(model_path=model_path)

llm = load_model()

st.title("Chat with GGUF Model")
st.write("Start interacting with your fine-tuned chatbot!")

# User input
user_input = st.text_input("You: ", placeholder="Type your message here...")

if user_input:
    # Generate a response using llama-cpp-python. llama_cpp's default
    # max_tokens is only 16, which truncated every answer mid-sentence,
    # so raise the completion budget explicitly.
    response = llm(user_input, max_tokens=256)
    st.text_area("Bot:", value=response["choices"][0]["text"].strip(), height=200)