qwen2.5-coder-generate

Sleeping

quan1998 committed on Jan 16

Commit

3f05231

verified ·

1 Parent(s): e66ae77

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -14,26 +14,26 @@ client = InferenceClient("Qwen/Qwen2.5-Coder-32B-Instruct")
 client = InferenceClient("Qwen/Qwen2.5-Coder-32B-Instruct")
-def greet(messages):
     response = ""
-    for message in client.chat_completion(
-        messages,
         stream=True,
-        max_tokens=1024,
         temperature=0.7,
         top_p=0.95
     ):
-        token = message.choices[0].delta.content
         response += token
         yield response
 demo = gr.Interface(
     fn=greet,
     inputs=[
-        gr.JSON(value=[{"role": "user", "content": "Bạn là AI"}])
     ],
     outputs=[gr.Textbox(label="result", lines=3)],
-    api_name="chat",
     clear_btn=None
 )

 client = InferenceClient("Qwen/Qwen2.5-Coder-32B-Instruct")
+def greet(message):
     response = ""
+    for token in client.text_generation(
+        message,
         stream=True,
+        max_new_tokens=12,
         temperature=0.7,
         top_p=0.95
     ):
+        print(token)
         response += token
         yield response
 demo = gr.Interface(
     fn=greet,
     inputs=[
+        gr.Textbox(label="message", value="The huggingface_hub library is ")
     ],
     outputs=[gr.Textbox(label="result", lines=3)],
+    api_name="generate",
     clear_btn=None
 )