Hugging Face Space (status: Sleeping) — commit "Update app.py" (Browse files); file: app.py — CHANGED
|
@@ -1,4 +1,5 @@
|
|
| 1 |
import gradio as gr
|
|
|
|
| 2 |
from huggingface_hub import InferenceClient
|
| 3 |
|
| 4 |
"""
|
|
@@ -7,7 +8,7 @@ For more information on `huggingface_hub` Inference API support, please check th
|
|
| 7 |
# Old revision: synchronous inference client, consistent with the plain
# `for` loop over `client.chat_completion(..., stream=True)` below.
client = InferenceClient("microsoft/Phi-3.5-mini-instruct")
|
| 8 |
|
| 9 |
|
| 10 |
-
def respond(
|
| 11 |
message,
|
| 12 |
history: list[tuple[str, str]],
|
| 13 |
system_message,
|
|
@@ -27,7 +28,7 @@ def respond(
|
|
| 27 |
|
| 28 |
response = ""
|
| 29 |
|
| 30 |
-
for message in client.chat_completion(
|
| 31 |
messages,
|
| 32 |
max_tokens=max_tokens,
|
| 33 |
stream=True,
|
|
@@ -59,6 +60,6 @@ demo = gr.ChatInterface(
|
|
| 59 |
],
|
| 60 |
)
|
| 61 |
|
| 62 |
-
|
| 63 |
if __name__ == "__main__":
|
| 64 |
-
demo.launch()
|
|
|
|
| 1 |
import gradio as gr
|
| 2 |
+
import asyncio
|
| 3 |
from huggingface_hub import AsyncInferenceClient, InferenceClient
|
| 4 |
|
| 5 |
"""
|
|
|
|
| 8 |
# Async client: the new `respond` consumes the stream with
# `async for message in client.chat_completion(..., stream=True)`, which
# requires AsyncInferenceClient — the synchronous InferenceClient returns a
# plain (non-async) iterator and `async for` over it raises TypeError.
client = AsyncInferenceClient("microsoft/Phi-3.5-mini-instruct")
|
| 9 |
|
| 10 |
|
| 11 |
+
async def respond(
|
| 12 |
message,
|
| 13 |
history: list[tuple[str, str]],
|
| 14 |
system_message,
|
|
|
|
| 28 |
|
| 29 |
response = ""
|
| 30 |
|
| 31 |
+
async for message in client.chat_completion(
|
| 32 |
messages,
|
| 33 |
max_tokens=max_tokens,
|
| 34 |
stream=True,
|
|
|
|
| 60 |
],
|
| 61 |
)
|
| 62 |
|
| 63 |
+
# Launch the app, processing up to 4 user requests concurrently.
if __name__ == "__main__":
    # NOTE(review): `concurrency_count` was removed in Gradio 4; passing it
    # raises TypeError. `default_concurrency_limit` is the Gradio 4+
    # equivalent — if this Space is pinned to Gradio 3.x, revert to
    # `concurrency_count=4`.
    demo.queue(default_concurrency_limit=4).launch()
|