Spaces: Runtime error
Update app.py
app.py CHANGED
```diff
@@ -271,9 +271,7 @@ def predict(
         response = strip_stop_words(full_response, stop_words)
         conversation.update_last_message(response)
         gradio_chatbot_output[-1][1] = response
-        yield gradio_chatbot_output, to_gradio_history(
-            conversation
-        ), "Generating..."
+        yield gradio_chatbot_output, #to_gradio_history(conversation), "Generating..."
 
         print("flushed result to gradio")
         torch.cuda.empty_cache()
@@ -284,7 +282,7 @@ def predict(
         f"temperature: {temperature}, top_p: {top_p}, repetition_penalty: {repetition_penalty}, max_length_tokens: {max_length_tokens}"
     )
 
-    yield gradio_chatbot_output
+    yield gradio_chatbot_output,, "Generate: Success",# to_gradio_history(conversation)
 
 
 def retry(
```
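As committed, neither new `yield` runs cleanly: in the first hunk the inline `#` comments out everything after it, so `yield gradio_chatbot_output,` produces a one-element tuple, and in the second hunk the double comma in `gradio_chatbot_output,, "Generate: Success"` is a Python SyntaxError, consistent with the Space's Runtime error status. Below is a minimal sketch of what the two yields might be aiming for, assuming the handler is now meant to feed exactly two Gradio outputs (chatbot and status) and to drop `to_gradio_history(conversation)`; `predict_outputs` is a hypothetical stand-in for the relevant part of `predict`, not code from this repo.

```python
def predict_outputs(gradio_chatbot_output):
    # Hunk 1 as committed reads `yield gradio_chatbot_output, #...`, which
    # yields the 1-tuple (gradio_chatbot_output,). Yielding the status string
    # explicitly keeps the output arity at two:
    yield gradio_chatbot_output, "Generating..."

    # Hunk 2 as committed has a double comma (`output,, "Generate: Success"`),
    # which is a SyntaxError; a single comma fixes it:
    yield gradio_chatbot_output, "Generate: Success"


# Usage: each yielded pair maps onto the two wired outputs in order.
for chatbot, status in predict_outputs([["hi", "hello"]]):
    print(status)
```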