Spaces:

talhasideline
/

hockey-mind-db

Running

talhasideline committed 12 days ago

Commit

a6a1c25

verified ·

1 Parent(s): 8ea01ce

Update Original_OpenAPI_DB.py

Files changed (1) hide show

Original_OpenAPI_DB.py CHANGED Viewed

@@ -143,7 +143,7 @@ hockey_keywords = [
     "midfielder", "middenvelder", "forward", "aanvaller", "striker", "spits", "player", "speler",
     "corner", "short corner", "penalty corner", "strafcorner", "free hit", "vrije slag",
     "tackle", "marking", "defending", "attacking", "skills", "technique", "techniek", "improve",
-    "tips", "advice", "help", "suggest", "recommendation", "better", "enhance"
 ]
 # Greetings for detection
@@ -316,7 +316,7 @@ def is_in_domain(prompt: str) -> bool:
                 similarity = util.cos_sim(prompt_embedding, hockey_embedding).item()
                 max_similarity = max(max_similarity, similarity)
-            has_hockey_semantic = max_similarity > 0.35  # Slightly higher threshold
             logging.debug(f"Hockey domain check for '{prompt}': keywords={has_hockey_keywords}, "
                          f"semantic={has_hockey_semantic} (score: {max_similarity:.3f})")
@@ -369,11 +369,11 @@ def is_greeting_or_vague(prompt: str, user_lang: str = "en") -> bool:
         return True
     # It's a greeting ONLY if:
-    # 1. High ratio of greeting words AND
     # 2. No hockey keywords AND
     # 3. No semantic hockey content
     is_pure_greeting = (
-        greeting_ratio > 0.7 and
         not has_hockey_keywords and
         not has_hockey_semantic
     )

     "midfielder", "middenvelder", "forward", "aanvaller", "striker", "spits", "player", "speler",
     "corner", "short corner", "penalty corner", "strafcorner", "free hit", "vrije slag",
     "tackle", "marking", "defending", "attacking", "skills", "technique", "techniek", "improve",
+    "tips", "advice", "help", "suggest", "better", "enhance"
 ]
 # Greetings for detection
                 similarity = util.cos_sim(prompt_embedding, hockey_embedding).item()
                 max_similarity = max(max_similarity, similarity)
+            has_hockey_semantic = max_similarity > 0.4  # Higher threshold to reduce false positives
             logging.debug(f"Hockey domain check for '{prompt}': keywords={has_hockey_keywords}, "
                          f"semantic={has_hockey_semantic} (score: {max_similarity:.3f})")
         return True
     # It's a greeting ONLY if:
+    # 1. High ratio of greeting words (>= 0.5), or a prompt of at most 2 words that contains a greeting word, AND
     # 2. No hockey keywords AND
     # 3. No semantic hockey content
     is_pure_greeting = (
+        (greeting_ratio >= 0.5 or (total_words <= 2 and greeting_words)) and
         not has_hockey_keywords and
         not has_hockey_semantic
     )