Armando Medina committed on
Commit 86e8c59 · 1 Parent(s): 16db460
Files changed (1)
  1. app.py +8 -16
app.py CHANGED
@@ -1,24 +1,16 @@
 import gradio as gr
 from huggingface_hub import InferenceClient
 
-"""
-For more information on `huggingface_hub` Inference API support, check:
-https://huggingface.co/docs/huggingface_hub/en/guides/inference
-"""
-
-# Initialize the Inference API Client with your model
-client = InferenceClient("one1cat/FineTunes_LLM_CFR_49")
-
+# 🔹 Initialize Hugging Face Inference Client
+client = InferenceClient(model="one1cat/FineTunes_LLM_CFR_49")
 
 def respond(message, history, system_message, max_tokens, temperature, top_p):
     """
-    Generates responses using the fine-tuned CFR 49 model.
+    Generates responses using the fine-tuned CFR 49 model hosted on Hugging Face.
     """
 
-    # Format prompt
     prompt = f"{system_message}\n\nUser: {message}\n\nAssistant:"
 
-    # Generate response
     response = ""
 
     try:
@@ -27,20 +19,20 @@ def respond(message, history, system_message, max_tokens, temperature, top_p):
             max_new_tokens=max_tokens,
             temperature=temperature,
             top_p=top_p,
-            stream=True,  # Enables token streaming
+            stream=True,  # Enables real-time streaming output
         ):
             response += token
-            yield response
+            yield response  # Stream response token by token
 
     except Exception as e:
-        yield f"Error: {str(e)}"
+        yield f"Error: {str(e)}"  # Handle potential API errors
 
 
-# Gradio Chat Interface
+# 🔹 Gradio Chat Interface
 demo = gr.ChatInterface(
     respond,
     additional_inputs=[
-        gr.Textbox(value="You are an AI trained on CFR 49 regulations.", label="System message"),
+        gr.Textbox(value="You are a CFR 49 regulatory compliance assistant.", label="System message"),
         gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
         gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
         gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-p (nucleus sampling)"),
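Both hunks elide the lines that open the streaming call (old 25-26 / new 17-18) and everything after the sliders, so for context here is a minimal sketch of how the post-commit respond() likely reads. The client.text_generation(...) wrapper, the list/call closers, and the demo.launch() guard are assumptions filled in from the surrounding context, not lines shown in this commit:

# Sketch only: the text_generation(...) call and the launch guard are
# assumptions; this commit's hunks do not show those lines.
import gradio as gr
from huggingface_hub import InferenceClient

client = InferenceClient(model="one1cat/FineTunes_LLM_CFR_49")


def respond(message, history, system_message, max_tokens, temperature, top_p):
    prompt = f"{system_message}\n\nUser: {message}\n\nAssistant:"
    response = ""
    try:
        # With stream=True and the default details=False, text_generation
        # yields plain token strings as the endpoint produces them.
        for token in client.text_generation(
            prompt,
            max_new_tokens=max_tokens,
            temperature=temperature,
            top_p=top_p,
            stream=True,
        ):
            response += token
            yield response  # ChatInterface re-renders the growing reply
    except Exception as e:
        yield f"Error: {str(e)}"


demo = gr.ChatInterface(
    respond,
    additional_inputs=[
        gr.Textbox(value="You are a CFR 49 regulatory compliance assistant.", label="System message"),
        gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
        gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
        gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-p (nucleus sampling)"),
    ],
)

if __name__ == "__main__":
    demo.launch()

Note that the generator yields the accumulated response rather than each token: gr.ChatInterface treats every yield as the full assistant message so far, which is what makes the reply appear to grow in place.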