Hjgugugjhuhjggg committed on
Commit
0a97d8a
·
verified ·
1 Parent(s): 4e57921

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -9
app.py CHANGED
@@ -11,7 +11,7 @@ import asyncio
11
  import gradio as gr
12
  import torch
13
  from dotenv import load_dotenv
14
- from fastapi import FastAPI
15
  from fastapi.responses import JSONResponse
16
  import uvicorn
17
  from threading import Thread
@@ -204,14 +204,10 @@ def get_best_response(responses):
204
  best_response_index = total_similarities.argmax()
205
  return responses[best_response_index]
206
 
async def generate_model_response(model, inputs, max_tokens=2048):
    """Return the de-duplicated completion text, capped at ``max_tokens`` words.

    Args:
        model: Callable invoked as ``model(inputs)``; its result must support
            ``result['choices'][0]['text']``.
        inputs: Prompt passed through to ``model`` unchanged.
        max_tokens: Maximum number of whitespace-separated words to keep.

    Returns:
        The text produced by ``remove_duplicates``. If it holds more than
        ``max_tokens`` words, only the first ``max_tokens`` words are
        returned, joined by single spaces. Returns ``""`` if anything raises.
    """
    import logging

    try:
        response = model(inputs)
        text = remove_duplicates(response['choices'][0]['text'])

        # Measure and truncate in the same unit (words). The previous code
        # counted words but sliced characters, cutting far more than intended.
        words = text.split()
        if len(words) > max_tokens:
            return " ".join(words[:max_tokens])
        return text
    except Exception:
        # Best-effort: callers receive an empty string, but the failure is
        # recorded instead of vanishing silently.
        logging.getLogger(__name__).exception("Model response generation failed")
        return ""
217
 
@@ -232,9 +228,10 @@ async def process_message(message):
232
  app = FastAPI()
233
 
class GenerateRequest(BaseModel):
    """JSON body accepted by ``POST /generate``."""

    # Text forwarded to process_message().
    message: str


@app.post("/generate")
async def generate(request: GenerateRequest):
    """Handle ``POST /generate``: run the message through ``process_message``.

    The body is declared as a model with a ``message`` field. The bare
    ``BaseModel`` used before declares no fields, so ``request.message``
    could never resolve and every call ended in the error branch.

    Args:
        request: Parsed request body carrying the ``message`` string.

    Returns:
        ``JSONResponse`` with ``{"response": ...}`` on success, or
        ``{"error": ...}`` holding the exception text if processing raises.
    """
    try:
        response = await process_message(request.message)
        return JSONResponse(content={"response": response})
    except Exception as e:
        return JSONResponse(content={"error": str(e)})
 
11
  import gradio as gr
12
  import torch
13
  from dotenv import load_dotenv
14
+ from fastapi import FastAPI, Request
15
  from fastapi.responses import JSONResponse
16
  import uvicorn
17
  from threading import Thread
 
204
  best_response_index = total_similarities.argmax()
205
  return responses[best_response_index]
206
 
async def generate_model_response(model, inputs):
    """Return the de-duplicated text of ``model``'s first completion.

    Args:
        model: Callable invoked as ``model(inputs)``; its result must support
            ``result['choices'][0]['text']``.
        inputs: Prompt passed through to ``model`` unchanged.

    Returns:
        The completion text after ``remove_duplicates``, or ``""`` if the
        model call or the post-processing raises.
    """
    import logging

    try:
        # NOTE(review): the model is called synchronously inside a coroutine;
        # if the call blocks, the event loop stalls for its duration. Confirm
        # whether it should be off-loaded (e.g. asyncio.to_thread).
        response = model(inputs)
        return remove_duplicates(response['choices'][0]['text'])
    except Exception:
        # Best-effort: callers receive an empty string, but the failure is
        # recorded instead of vanishing silently.
        logging.getLogger(__name__).exception("Model response generation failed")
        return ""
213
 
 
228
  app = FastAPI()
229
 
@app.post("/generate")
async def generate(request: Request):
    """Handle ``POST /generate``: run the posted message through ``process_message``.

    Expects a JSON object body with a ``message`` key.

    Args:
        request: Incoming HTTP request; its body is read as JSON.

    Returns:
        ``JSONResponse`` with ``{"response": ...}`` on success. A body that
        is not valid JSON or lacks ``message`` yields ``{"error": ...}`` with
        HTTP 400; a failure while processing yields ``{"error": ...}`` with
        HTTP 500. Previously every error was reported with HTTP 200.
    """
    try:
        body = await request.json()
        message = body['message']
    except (ValueError, KeyError, TypeError):
        # ValueError: body is not valid JSON; KeyError: no 'message' key;
        # TypeError: JSON value is not an object (list, string, number...).
        return JSONResponse(
            content={"error": "Request body must be a JSON object with a 'message' field"},
            status_code=400,
        )

    try:
        response = await process_message(message)
        return JSONResponse(content={"response": response})
    except Exception as e:
        return JSONResponse(content={"error": str(e)}, status_code=500)