Update app.py
app.py
CHANGED
@@ -17,14 +17,18 @@ client = InferenceClient(MODEL_REPO)
 
 # ---------------- CHAT FUNCTION ----------------
 def stream_response(message, chat_history, system_message, max_tokens, temperature, top_p, response_style):
-    if response_style == "
+    if response_style == "Concise":
         system_message += " Keep answers short and direct."
-    elif response_style == "
+    elif response_style == "Detailed":
         system_message += " Provide more explanation and context when helpful."
-    elif response_style == "
+    elif response_style == "Essay":
         system_message += " Write long, structured, essay-style responses."
 
     messages = [{"role": "system", "content": system_message}]
+    for user, bot in chat_history:
+        messages.append({"role": "user", "content": user})
+        messages.append({"role": "assistant", "content": bot})
+    messages.append({"role": "user", "content": message})
 
     response = ""
     for msg in client.chat_completion(
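The first hunk cuts off inside the streaming loop. For orientation, here is a minimal sketch of how that loop is typically written against huggingface_hub's InferenceClient. The chat_completion parameter names are the hub client's real API; the loop body, the yield shape, and the model id are assumptions, not copied from the file:

from huggingface_hub import InferenceClient

client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")  # stand-in for MODEL_REPO

def stream_response(message, chat_history, system_message,
                    max_tokens, temperature, top_p, response_style):
    # Style handling and history folding as in the hunk above.
    messages = [{"role": "system", "content": system_message}]
    for user, bot in chat_history:
        messages.append({"role": "user", "content": user})
        messages.append({"role": "assistant", "content": bot})
    messages.append({"role": "user", "content": message})

    response = ""
    for chunk in client.chat_completion(
        messages,
        max_tokens=max_tokens,
        stream=True,              # yield incremental deltas instead of one message
        temperature=temperature,
        top_p=top_p,
    ):
        response += chunk.choices[0].delta.content or ""
        # Clear the textbox and repaint the partial answer on every delta.
        yield "", chat_history + [(message, response)]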
@@ -50,8 +54,8 @@ with gr.Blocks(theme=gr.themes.Soft(primary_hue="violet", secondary_hue="pink"))
         )
 
         chatbot = gr.Chatbot(
+            type="messages",  # ✅ new format
             height=500,
-            bubble_full_width=False,
             show_copy_button=True,
             label="Chat"
         )
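One thing to watch in this hunk: with type="messages", Gradio stores chat history as OpenAI-style {"role": ..., "content": ...} dicts rather than (user, bot) tuples, so the for user, bot in chat_history loop in the first hunk assumes the old tuple format. If the deployed Gradio version passes messages-format history, the folding step would look more like this sketch (build_messages is an illustrative helper, not part of the file):

def build_messages(system_message, chat_history, message):
    # chat_history arrives as e.g.
    # [{"role": "user", "content": "hi"}, {"role": "assistant", "content": "hey"}]
    messages = [{"role": "system", "content": system_message}]
    messages.extend({"role": m["role"], "content": m["content"]} for m in chat_history)
    messages.append({"role": "user", "content": message})
    return messages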
@@ -71,22 +75,27 @@ with gr.Blocks(theme=gr.themes.Soft(primary_hue="violet", secondary_hue="pink"))
             value=SYSTEM_PROMPT_DEFAULT,
             lines=3
         )
+        response_style = gr.Dropdown(
+            ["Concise", "Detailed", "Essay"],
+            value="Concise",
+            label="Response Style"
+        )
         temperature = gr.Slider(0.1, 1.5, value=TEMP_DEFAULT, step=0.1, label="Temperature")
         top_p = gr.Slider(0.1, 1.0, value=TOP_P_DEFAULT, step=0.05, label="Top-p")
         max_tokens = gr.Slider(32, 2048, value=MAX_NEW_TOKENS_DEFAULT, step=16, label="Max new tokens")
 
     # Events (streaming response)
     send_btn.click(
-
-
-
+        stream_response,
+        [msg, chatbot, system_prompt, max_tokens, temperature, top_p, response_style],
+        [msg, chatbot]
     )
     msg.submit(
-
-
-
+        stream_response,
+        [msg, chatbot, system_prompt, max_tokens, temperature, top_p, response_style],
+        [msg, chatbot]
     )
     clear_btn.click(lambda: None, None, chatbot, queue=False)
 
 if __name__ == "__main__":
-    demo.launch()
+    demo.launch()
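Because stream_response is a generator, each yield repaints the [msg, chatbot] outputs in place; send_btn.click(fn, inputs, outputs) and msg.submit(...) take the handler and the component lists positionally, exactly as wired above. A self-contained sketch of the same pattern, in which the layout and the echo handler are assumptions and only the event signatures mirror the diff:

import gradio as gr

with gr.Blocks() as demo:
    chatbot = gr.Chatbot(type="messages", height=500)
    msg = gr.Textbox(label="Message")
    send_btn = gr.Button("Send")
    clear_btn = gr.Button("Clear")

    def echo_stream(message, history):
        # Generator handlers stream: every yield updates the outputs.
        history = history + [{"role": "user", "content": message},
                             {"role": "assistant", "content": ""}]
        for ch in "echo: " + message:
            history[-1]["content"] += ch
            yield "", history

    send_btn.click(echo_stream, [msg, chatbot], [msg, chatbot])
    msg.submit(echo_stream, [msg, chatbot], [msg, chatbot])
    clear_btn.click(lambda: None, None, chatbot, queue=False)

if __name__ == "__main__":
    demo.launch()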
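On current Gradio releases the streaming wiring above works as-is, since queuing is enabled by default; on older 3.x releases a demo.queue() call before demo.launch() was needed for a generator handler's incremental yields to reach the browser.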