Spaces:

vcasas
/

llama-index_tests

Runtime error

vcasas committed on Dec 8, 2024

Commit

b46dd63

verified ·

1 Parent(s): 88177fc

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -45,12 +45,28 @@ def create_article_embeddings(articles, model_name="paraphrase-multilingual-mpne
 # 4. Buscar el artículo relevante
 def find_article(question, article_keys, article_embeddings, model, articles):
-    """Busca el artículo más relevante para la pregunta utilizando embeddings."""
     question_embedding = model.encode(question, convert_to_tensor=True)
-    scores = util.pytorch_cos_sim(question_embedding, article_embeddings)
     best_match_idx = scores.argmax()
-    best_article_key = article_keys[best_match_idx]
-    return f"{best_article_key}\n{articles[best_article_key]}"
 # Flujo principal
 def main():

 # 4. Buscar el artículo relevante
 def find_article(question, article_keys, article_embeddings, model, articles):
+    # Filtrar artículos relevantes usando palabras clave
+    keywords = question.lower().split()  # Dividir pregunta en palabras clave
+    filtered_articles = {
+        key: value for key, value in articles.items()
+        if any(keyword in value.lower() for keyword in keywords)
+    }
+    if not filtered_articles:
+        # Si no hay artículos relevantes basados en palabras clave, usar todos
+        filtered_articles = articles
+    # Crear nuevos embeddings para los artículos filtrados
+    filtered_keys = list(filtered_articles.keys())
+    filtered_embeddings = model.encode(list(filtered_articles.values()), convert_to_tensor=True)
+    # Calcular similitud con la pregunta
     question_embedding = model.encode(question, convert_to_tensor=True)
+    scores = util.pytorch_cos_sim(question_embedding, filtered_embeddings)
     best_match_idx = scores.argmax()
+    best_article_key = filtered_keys[best_match_idx]
+    return f"{best_article_key}\n{filtered_articles[best_article_key]}"
 # Flujo principal
 def main():