Commit 8853ea0 · Parent: f095082

added Model dropdown in sidebar

Files changed:
- app.py (+15 −4)
- rag/synth.py (+16 −4)
app.py
CHANGED

```diff
@@ -32,7 +32,7 @@ def add_user(user_msg: str, history: list[tuple]) -> tuple[str, list[tuple]]:
 
 
 # ---------- Chat step 2: stream assistant answer ----------
-def bot(history: list[tuple], api_key: str, top_k: int):
+def bot(history: list[tuple], api_key: str, top_k: int, model_name: str):
     """
     Yields (history, sources_markdown) while streaming.
     """
@@ -63,7 +63,7 @@ def bot(history: list[tuple], api_key: str, top_k: int):
     # Streaming LLM
     acc = ""
     try:
-        for chunk in synth_answer_stream(user_msg, hits[:k]):
+        for chunk in synth_answer_stream(user_msg, hits[:k], model=model_name):
             acc += chunk or ""
             step_hist = deepcopy(history)
             step_hist[-1] = (user_msg, acc)
@@ -109,6 +109,17 @@ with gr.Blocks(theme="soft", fill_height=True) as demo:
             type="password",
             placeholder="sk-… (optional if set in env)"
         )
+        # let user choose the OpenAI model
+        model = gr.Dropdown(
+            label="⚙️ OpenAI model",
+            choices=[
+                "gpt-4o-mini",
+                "gpt-4o",
+                "gpt-4.1-mini",
+                "gpt-3.5-turbo"
+            ],
+            value="gpt-4o-mini"
+        )
         topk = gr.Slider(1, 10, value=5, step=1, label="Top-K passages")
         # you can wire this later; not used now
 
@@ -144,7 +155,7 @@ with gr.Blocks(theme="soft", fill_height=True) as demo:
     send_click = send.click(add_user, [msg, state], [msg, state])
     send_click.then(
         bot,
-        [state, api_key, topk],
+        [state, api_key, topk, model],
         [chat, sources],
         show_progress="minimal",
     ).then(lambda h: h, chat, state)
@@ -152,7 +163,7 @@ with gr.Blocks(theme="soft", fill_height=True) as demo:
     msg_submit = msg.submit(add_user, [msg, state], [msg, state])
     msg_submit.then(
         bot,
-        [state, api_key, topk],
+        [state, api_key, topk, model],
         [chat, sources],
         show_progress="minimal",
     ).then(lambda h: h, chat, state)
```
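For context, a minimal runnable sketch of the Gradio pattern this commit relies on; the component names and the stub handler below are illustrative, not the app's actual code. A `gr.Dropdown` needs no special wiring: listing it among an event's inputs makes Gradio pass its current value to the handler on every submit.

```python
import gradio as gr

def answer(message: str, model_name: str) -> str:
    # illustrative stub: the real app streams LLM chunks instead
    return f"[{model_name}] You said: {message}"

with gr.Blocks() as demo:
    model = gr.Dropdown(
        label="OpenAI model",
        choices=["gpt-4o-mini", "gpt-4o"],
        value="gpt-4o-mini",
    )
    msg = gr.Textbox(label="Message")
    out = gr.Textbox(label="Answer")
    # the dropdown is just another input: its current value is read per event
    msg.submit(answer, [msg, model], out)

if __name__ == "__main__":
    demo.launch()
```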
rag/synth.py
CHANGED

```diff
@@ -8,6 +8,14 @@ from datetime import date
 LLM_MODEL = os.getenv("LLM_MODEL", "gpt-4o-mini")
 LLM_BASE_URL = os.getenv("LLM_BASE_URL", "https://api.openai.com/v1")
 
+# _MONTHS_FR = {
+#     1: "janvier", 2: "février", 3: "mars", 4: "avril", 5: "mai", 6: "juin",
+#     7: "juillet", 8: "août", 9: "septembre", 10: "octobre", 11: "novembre", 12: "décembre"
+# }
+# def today_fr():
+#     d = date.today()
+#     return f"{d.day} {_MONTHS_FR[d.month]} {d.year}"
+
 def _build_prompt(query, passages):
 
     # Build numbered, tagged source blocks
@@ -26,12 +34,15 @@ def _build_prompt(query, passages):
 
     context = "\n\n".join(blocks)
     query = utf8_safe(query)
-    today = date.today().strftime("%d %
-
+    today = date.today().strftime("%Y-%m-%d")  # e.g. "2025-08-27"
 
     return (
         "Tu es un assistant RH chargé de répondre à des questions dans le domaine des ressources humaines en t'appuyant sur les sources fournies.\n"
-        "La date d'aujourd'hui est : {today}.\n\n"
+        f"La date d'aujourd'hui est : {today} (au format AAAA-MM-JJ).\n\n"
+        "⚠️ Consigne temporelle : Les textes sources peuvent avoir été rédigés avant aujourd'hui "
+        "et mentionner des changements à venir. Interprète ces formulations en fonction de la date actuelle. "
+        "Si une mesure annoncée est déjà en vigueur aujourd'hui, écris-la au présent ou au passé, "
+        "jamais au futur.\n\n"
         "Consignes :\n"
         "- Réponds de manière factuelle, concise et polie (vouvoiement).\n"
         "- Quand tu affirmes un fait, cite tes sources en fin de phrase avec le format [1], [2]… en te basant sur l'index de ces sources (ex: [1] est la source 1, [2] est la source 2, etc.)\n\n"
@@ -43,8 +54,9 @@ def _build_prompt(query, passages):
         "Réponse:"
     )
 
-def synth_answer_stream(query, passages):
+def synth_answer_stream(query, passages, model: str | None = None):
     client = OpenAI(api_key=os.getenv("OPENAI_API_KEY"), base_url=LLM_BASE_URL)
+    model = model or LLM_MODEL
     prompt = utf8_safe(_build_prompt(query, passages))
 
     stream = client.chat.completions.create(
```
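Usage note: the new optional `model` argument overrides the `LLM_MODEL` environment default per call. A hedged sketch, assuming `OPENAI_API_KEY` is set and a passage shape the retriever might return (its real format is not shown in this diff):

```python
from rag.synth import synth_answer_stream

# assumed passage shape; adapt to whatever the retriever actually returns
hits = [{"text": "Le préavis de démission est de trois mois.", "source": "accord_entreprise.pdf"}]

# an explicit model overrides LLM_MODEL; omit it to keep the env default
for chunk in synth_answer_stream("Quel est le préavis de démission ?", hits, model="gpt-4o"):
    print(chunk, end="", flush=True)
```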
|