Spaces:
Build error
Build error
Update app.py
Browse files
app.py
CHANGED
|
@@ -1,89 +1,72 @@
|
|
| 1 |
import gradio as gr
|
| 2 |
-
import chromadb
|
| 3 |
-
from sentence_transformers import SentenceTransformer
|
| 4 |
from llama_cpp import Llama
|
| 5 |
|
| 6 |
-
#
|
| 7 |
-
chroma_client = chromadb.PersistentClient(path="./chromadb_store")
|
| 8 |
-
collection = chroma_client.get_or_create_collection(name="curly_strings_knowledge")
|
| 9 |
-
|
| 10 |
-
# ✅ Load Local Embedding Model
|
| 11 |
-
embedder = SentenceTransformer("sentence-transformers/all-MiniLM-L6-v2")
|
| 12 |
-
|
| 13 |
-
# ✅ Curly Strings Knowledge (Stored in ChromaDB as Vectors)
|
| 14 |
-
knowledge_base = [
|
| 15 |
-
{"id": "song_list", "text": """
|
| 16 |
-
Curly Strings is an Estonian folk band known for blending traditional and modern sounds.
|
| 17 |
-
Here are some of their popular songs:
|
| 18 |
-
1. Kalakesed
|
| 19 |
-
2. Kus mu süda on ...
|
| 20 |
-
3. Vitsalaul
|
| 21 |
-
4. Viimases jaamas
|
| 22 |
-
5. Salaja
|
| 23 |
-
6. Üle ilma
|
| 24 |
-
7. Šveits
|
| 25 |
-
8. Kallimale
|
| 26 |
-
9. Üksteist peab hoidma
|
| 27 |
-
10. Suuda öelda ei
|
| 28 |
-
"""},
|
| 29 |
-
{"id": "related_artists", "text": """
|
| 30 |
-
If you enjoy Curly Strings, you might also like:
|
| 31 |
-
- Trad.Attack!
|
| 32 |
-
- Eesti Raadio laululapsed
|
| 33 |
-
- Körsikud
|
| 34 |
-
- Karl-Erik Taukar
|
| 35 |
-
- Dag
|
| 36 |
-
"""},
|
| 37 |
-
{"id": "background", "text": """
|
| 38 |
-
Curly Strings started in Estonia and became famous for their unique blend of folk and contemporary music.
|
| 39 |
-
They often perform at international festivals and are known for their emotional and poetic lyrics.
|
| 40 |
-
"""}
|
| 41 |
-
]
|
| 42 |
-
|
| 43 |
-
# ✅ Store Knowledge in ChromaDB (If Not Already Stored)
|
| 44 |
-
existing_data = collection.get()
|
| 45 |
-
if not existing_data["ids"]:
|
| 46 |
-
for item in knowledge_base:
|
| 47 |
-
embedding = embedder.encode(item["text"]).tolist()
|
| 48 |
-
collection.add(documents=[item["text"]], embeddings=[embedding], ids=[item["id"]])
|
| 49 |
-
|
| 50 |
-
# ✅ Load Llama Model
|
| 51 |
llm = Llama.from_pretrained(
|
| 52 |
repo_id="krishna195/second_guff",
|
| 53 |
filename="unsloth.Q4_K_M.gguf",
|
| 54 |
)
|
| 55 |
|
| 56 |
-
#
|
| 57 |
-
def retrieve_context(query):
|
| 58 |
-
query_embedding = embedder.encode(query).tolist()
|
| 59 |
-
results = collection.query(query_embeddings=[query_embedding], n_results=2)
|
| 60 |
-
|
| 61 |
-
# Flatten nested lists and ensure only strings are returned
|
| 62 |
-
retrieved_texts = [doc for sublist in results.get("documents", []) for doc in sublist if isinstance(doc, str)]
|
| 63 |
-
|
| 64 |
-
return "\n".join(retrieved_texts) if retrieved_texts else "No relevant data found."
|
| 65 |
-
|
| 66 |
-
# ✅ Chatbot Function with ChromaDB-RAG
|
| 67 |
def chatbot_response(user_input):
|
| 68 |
-
|
| 69 |
-
|
| 70 |
-
|
| 71 |
-
|
| 72 |
-
|
| 73 |
-
|
| 74 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 75 |
|
|
|
|
| 76 |
response = llm.create_chat_completion(
|
| 77 |
-
messages=
|
|
|
|
|
|
|
|
|
|
| 78 |
temperature=0.5,
|
| 79 |
-
max_tokens=
|
| 80 |
top_p=0.9,
|
| 81 |
frequency_penalty=0.8,
|
| 82 |
)
|
| 83 |
|
| 84 |
return response["choices"][0]["message"]["content"].strip()
|
| 85 |
|
| 86 |
-
#
|
| 87 |
iface = gr.Interface(
|
| 88 |
fn=chatbot_response,
|
| 89 |
inputs=gr.Textbox(placeholder="Ask me about Curly Strings..."),
|
|
@@ -93,5 +76,5 @@ iface = gr.Interface(
|
|
| 93 |
theme="compact",
|
| 94 |
)
|
| 95 |
|
| 96 |
-
#
|
| 97 |
-
iface.launch()
|
|
|
|
| 1 |
import gradio as gr
|
|
|
|
|
|
|
| 2 |
from llama_cpp import Llama
|
| 3 |
|
| 4 |
+
# Load the Llama model
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5 |
llm = Llama.from_pretrained(
|
| 6 |
repo_id="krishna195/second_guff",
|
| 7 |
filename="unsloth.Q4_K_M.gguf",
|
| 8 |
)
|
| 9 |
|
| 10 |
+
# Define the chatbot function
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 11 |
def chatbot_response(user_input):
|
| 12 |
+
# System instructions
|
| 13 |
+
system_prompt = """
|
| 14 |
+
You are a chatbot specializing in recommending songs by the Estonian folk band **Curly Strings**.
|
| 15 |
+
based on this anw the question and give the link of the source
|
| 16 |
+
## 🎵 **Song List**
|
| 17 |
+
Here are some songs by Curly Strings:
|
| 18 |
+
1. **Kalakesed**
|
| 19 |
+
2. **Kus mu süda on ...**
|
| 20 |
+
3. **Vitsalaul**
|
| 21 |
+
4. **Viimases jaamas**
|
| 22 |
+
5. **Salaja**
|
| 23 |
+
6. **Üle ilma**
|
| 24 |
+
7. **Šveits**
|
| 25 |
+
8. **Kallimale**
|
| 26 |
+
9. **Üksteist peab hoidma**
|
| 27 |
+
10. **Suuda öelda ei**
|
| 28 |
+
11. **Annan käe**
|
| 29 |
+
12. **Tulbid ja Bonsai**
|
| 30 |
+
13. **Tüdruk Pika Kleidiga**
|
| 31 |
+
14. **Armasta mind (feat. Vaiko Eplik)**
|
| 32 |
+
15. **Minu, Pets, Margus ja Priit**
|
| 33 |
+
16. **Kauges külas**
|
| 34 |
+
17. **Tule ja jää**
|
| 35 |
+
18. **Kuutõbine**
|
| 36 |
+
19. **Omaenese ilus ja veas**
|
| 37 |
+
20. **Pulmad**
|
| 38 |
+
21. **Pillimeeste laul**
|
| 39 |
+
22. **Tehke ruumi!**
|
| 40 |
+
## 🎤 **Related Artists**
|
| 41 |
+
If you enjoy Curly Strings, you might also like:
|
| 42 |
+
- **Trad.Attack!**
|
| 43 |
+
- **Eesti Raadio laululapsed**
|
| 44 |
+
- **Körsikud**
|
| 45 |
+
- **Karl-Erik Taukar**
|
| 46 |
+
- **Dag**
|
| 47 |
+
- **Sadamasild**
|
| 48 |
+
- **Kruuv**
|
| 49 |
+
- **Smilers**
|
| 50 |
+
- **Mari Jürjens**
|
| 51 |
+
- **Terminaator**
|
| 52 |
+
---
|
| 53 |
+
"""
|
| 54 |
|
| 55 |
+
# Generate response from Llama model
|
| 56 |
response = llm.create_chat_completion(
|
| 57 |
+
messages=[
|
| 58 |
+
{"role": "system", "content": system_prompt},
|
| 59 |
+
{"role": "user", "content": user_input}
|
| 60 |
+
],
|
| 61 |
temperature=0.5,
|
| 62 |
+
max_tokens=1000, # Increased for better answers
|
| 63 |
top_p=0.9,
|
| 64 |
frequency_penalty=0.8,
|
| 65 |
)
|
| 66 |
|
| 67 |
return response["choices"][0]["message"]["content"].strip()
|
| 68 |
|
| 69 |
+
# Create Gradio interface
|
| 70 |
iface = gr.Interface(
|
| 71 |
fn=chatbot_response,
|
| 72 |
inputs=gr.Textbox(placeholder="Ask me about Curly Strings..."),
|
|
|
|
| 76 |
theme="compact",
|
| 77 |
)
|
| 78 |
|
| 79 |
+
# Launch the Gradio app
|
| 80 |
+
iface.launch()
|