Spaces:

kavg
/

sri-doc

Runtime error

kavg committed on May 4, 2024

Commit

80d398c

1 Parent(s): d0225fc

removed multiple ocr api calls

Files changed (2) hide show

main.py CHANGED Viewed

@@ -44,7 +44,8 @@ async def ProcessDocument(file: UploadFile):
     raise HTTPException(status_code=400, detail="Cannot apply OCR to the image")
   try:
     tokenClassificationOutput, img_size = LabelTokens(ocr_df, image)
-  except:
     raise HTTPException(status_code=400, detail="Entity identification failed")
   try:
@@ -98,23 +99,16 @@ def ApplyOCR(content):
     # printed_ocr_df.to_csv('temp/complete_image_ocr.csv', index=False)
     # return  printed_ocr_df, image
   except Exception as e:
     raise HTTPException(status_code=400, detail="Printed OCR process failed")
   try:
     trocr_client = ocr.TrOCRClient(config['settings'].TROCR_API_URL)
     handwritten_ocr_df = trocr_client.ocr(handwritten_imgs, image)
-  except:
     raise HTTPException(status_code=400, detail="handwritten OCR process failed")
-  try:
-    jpeg_bytes = io.BytesIO()
-    printed_img.save(jpeg_bytes, format='JPEG')
-    jpeg_content = jpeg_bytes.getvalue()
-    vision_client = ocr.VisionClient(config['settings'].GCV_AUTH)
-    printed_ocr_df = vision_client.ocr(jpeg_content, printed_img)
-  except:
-    raise HTTPException(status_code=400, detail="Printed OCR process failed")
   ocr_df = pd.concat([handwritten_ocr_df, printed_ocr_df])
   return ocr_df, image

     raise HTTPException(status_code=400, detail="Cannot apply OCR to the image")
   try:
     tokenClassificationOutput, img_size = LabelTokens(ocr_df, image)
+  except Exception as e:
+    print(e)
     raise HTTPException(status_code=400, detail="Entity identification failed")
   try:
     # printed_ocr_df.to_csv('temp/complete_image_ocr.csv', index=False)
     # return  printed_ocr_df, image
   except Exception as e:
+    print(e)
     raise HTTPException(status_code=400, detail="Printed OCR process failed")
   try:
     trocr_client = ocr.TrOCRClient(config['settings'].TROCR_API_URL)
     handwritten_ocr_df = trocr_client.ocr(handwritten_imgs, image)
+  except Exception as e:
+    print(e)
     raise HTTPException(status_code=400, detail="handwritten OCR process failed")
   ocr_df = pd.concat([handwritten_ocr_df, printed_ocr_df])
   return ocr_df, image

ocr.py CHANGED Viewed

@@ -12,6 +12,8 @@ image_ext = ("*.jpg", "*.jpeg", "*.png")
 class VisionClient:
     def __init__(self, auth):
         credentials = service_account.Credentials.from_service_account_info(
             auth
         )

 class VisionClient:
     def __init__(self, auth):
+        # with open('temp/client_secret.json') as f:
+        #     auth = json.load(f)
         credentials = service_account.Credentials.from_service_account_info(
             auth
         )