Spaces:
Running
Running
Update retriever.py
Browse files - retriever.py +9 -3
retriever.py
CHANGED
@@ -2,7 +2,13 @@ import chromadb
|
|
2 |
from sentence_transformers import SentenceTransformer
|
3 |
import os
|
4 |
|
5 |
-
#
|
|
|
|
|
|
|
|
|
|
|
|
|
6 |
os.makedirs("/tmp/data", exist_ok=True)
|
7 |
|
8 |
# Initialize ChromaDB
|
@@ -10,8 +16,8 @@ os.makedirs("/tmp/data", exist_ok=True)
|
|
10 |
chroma_client = chromadb.EphemeralClient() # In-memory mode, resets on restart
|
11 |
|
12 |
|
13 |
-
# Load embedding model
|
14 |
-
embed_model = SentenceTransformer("sentence-transformers/all-MiniLM-L6-v2")
|
15 |
|
16 |
# Create collection (vector storage)
|
17 |
collection = chroma_client.get_or_create_collection(name="documents")
|
|
|
2 |
from sentence_transformers import SentenceTransformer
|
3 |
import os
|
4 |
|
5 |
+
# Set Hugging Face cache directory to a writable location
|
6 |
+
os.environ["HF_HOME"] = "/tmp/huggingface"
|
7 |
+
os.environ["TRANSFORMERS_CACHE"] = "/tmp/huggingface"
|
8 |
+
os.environ["SENTENCE_TRANSFORMERS_HOME"] = "/tmp/huggingface"
|
9 |
+
|
10 |
+
# Ensure /tmp directories exist
|
11 |
+
os.makedirs("/tmp/huggingface", exist_ok=True)
|
12 |
os.makedirs("/tmp/data", exist_ok=True)
|
13 |
|
14 |
# Initialize ChromaDB
|
|
|
16 |
chroma_client = chromadb.EphemeralClient() # In-memory mode, resets on restart
|
17 |
|
18 |
|
19 |
+
# Load embedding model - previously: sentence-transformers/
|
20 |
+
embed_model = SentenceTransformer("all-MiniLM-L6-v2")
|
21 |
|
22 |
# Create collection (vector storage)
|
23 |
collection = chroma_client.get_or_create_collection(name="documents")
|