Update app.py
Browse files
app.py
CHANGED
@@ -11,7 +11,7 @@ import asyncio
|
|
11 |
import gradio as gr
|
12 |
import torch
|
13 |
from dotenv import load_dotenv
|
14 |
-
from fastapi import FastAPI
|
15 |
from fastapi.responses import JSONResponse
|
16 |
import uvicorn
|
17 |
from threading import Thread
|
@@ -204,14 +204,10 @@ def get_best_response(responses):
|
|
204 |
best_response_index = total_similarities.argmax()
|
205 |
return responses[best_response_index]
|
206 |
|
207 |
-
async def generate_model_response(model, inputs
|
208 |
try:
|
209 |
response = model(inputs)
|
210 |
-
|
211 |
-
|
212 |
-
if len(text.split()) > max_tokens:
|
213 |
-
return text[:max_tokens]
|
214 |
-
return text
|
215 |
except Exception as e:
|
216 |
return ""
|
217 |
|
@@ -232,9 +228,10 @@ async def process_message(message):
|
|
232 |
app = FastAPI()
|
233 |
|
234 |
@app.post("/generate")
|
235 |
-
async def generate(request:
|
236 |
try:
|
237 |
-
|
|
|
238 |
return JSONResponse(content={"response": response})
|
239 |
except Exception as e:
|
240 |
return JSONResponse(content={"error": str(e)})
|
|
|
11 |
import gradio as gr
|
12 |
import torch
|
13 |
from dotenv import load_dotenv
|
14 |
+
from fastapi import FastAPI, Request
|
15 |
from fastapi.responses import JSONResponse
|
16 |
import uvicorn
|
17 |
from threading import Thread
|
|
|
204 |
best_response_index = total_similarities.argmax()
|
205 |
return responses[best_response_index]
|
206 |
|
207 |
+
async def generate_model_response(model, inputs):
    """Call ``model`` on ``inputs`` and return the cleaned first completion.

    The model result is indexed as ``response['choices'][0]['text']`` and
    that text is passed through ``remove_duplicates`` (defined elsewhere in
    this file) before being returned.

    Args:
        model: Callable invoked as ``model(inputs)``.
        inputs: Value forwarded unchanged to ``model``.

    Returns:
        The value returned by ``remove_duplicates``, or ``""`` if the model
        call, the result lookup, or the clean-up step raises.
    """
    # Function-scope import so this block does not depend on the file's
    # import section.
    import logging

    try:
        response = model(inputs)
        return remove_duplicates(response['choices'][0]['text'])
    except Exception:
        # Best-effort contract: callers get an empty string on failure, but
        # the failure is logged with its traceback instead of being dropped.
        logging.getLogger(__name__).exception("Model response generation failed")
        return ""
|
213 |
|
|
|
228 |
app = FastAPI()


@app.post("/generate")
async def generate(request: Request):
    """Handle ``POST /generate`` by running the posted message through ``process_message``.

    The request body is parsed as JSON and its ``"message"`` entry is passed
    to ``process_message`` (defined elsewhere in this file).

    Returns:
        ``{"response": ...}`` on success.
        ``{"error": ...}`` with HTTP 400 when the body is not valid JSON or
        has no ``"message"`` entry.
        ``{"error": ...}`` with HTTP 500 when ``process_message`` raises.
    """
    # Client-side problems (bad JSON, wrong shape, missing key) are reported
    # as 400 rather than hidden behind a 200 response.
    try:
        body = await request.json()
        message = body['message']
    except (ValueError, KeyError, TypeError):
        return JSONResponse(
            content={"error": "Request body must be a JSON object with a 'message' field"},
            status_code=400,
        )

    try:
        response = await process_message(message)
        return JSONResponse(content={"response": response})
    except Exception as e:
        # Keep the original error payload shape, but signal failure through
        # the status code so clients can detect it without parsing the body.
        return JSONResponse(content={"error": str(e)}, status_code=500)
|