Spaces:

brestok
/

ocr-backend

Running

App Files Community

Istvan-Adem committed on Feb 7

Commit

912670d

1 Parent(s): 71a8eab

Make main identical to ai

Browse files

Files changed (7) hide show

ocr/__init__.py +0 -12
ocr/api/message/openai_request.py +17 -0
ocr/api/message/prompts.py +44 -0
ocr/api/message/utils.py +10 -15
ocr/api/message/views.py +6 -2
ocr/core/wrappers.py +30 -0
requirements.txt +2 -0

ocr/__init__.py CHANGED Viewed

@@ -1,9 +1,6 @@
-import os
 from fastapi import FastAPI
 from fastapi.middleware.cors import CORSMiddleware
 from starlette.exceptions import HTTPException as StarletteHTTPException
-from starlette.staticfiles import StaticFiles
 from ocr.core.config import settings
 from ocr.core.wrappers import OcrResponseWrapper, ErrorOcrResponse
@@ -22,15 +19,6 @@ def create_app() -> FastAPI:
         allow_headers=["*"],
     )
-    static_directory = os.path.join(settings.BASE_DIR, 'static')
-    if not os.path.exists(static_directory):
-        os.makedirs(static_directory)
-    app.mount(
-        '/static',
-        StaticFiles(directory='static'),
-    )
     @app.exception_handler(StarletteHTTPException)
     async def http_exception_handler(_, exc):
         return OcrResponseWrapper(

 from fastapi import FastAPI
 from fastapi.middleware.cors import CORSMiddleware
 from starlette.exceptions import HTTPException as StarletteHTTPException
 from ocr.core.config import settings
 from ocr.core.wrappers import OcrResponseWrapper, ErrorOcrResponse
         allow_headers=["*"],
     )
     @app.exception_handler(StarletteHTTPException)
     async def http_exception_handler(_, exc):
         return OcrResponseWrapper(

ocr/api/message/openai_request.py ADDED Viewed

	@@ -0,0 +1,17 @@

+from ocr.api.message.prompts import OCRPrompts
+from ocr.core.wrappers import openai_wrapper
+@openai_wrapper(model='gpt-4o-mini')
+async def generate_report(text: str):
+    messages = [
+        {
+            "role": "system",
+            "content": OCRPrompts.generate_general_answer
+        },
+        {
+            "role": "user",
+            "content": f"Generate a report based on this data:\n\n```\n{text}\n```"
+        }
+    ]
+    return messages

ocr/api/message/prompts.py ADDED Viewed

	@@ -0,0 +1,44 @@

+class OCRPrompts:
+    generate_general_answer = """## Task
+You must analyze the text extracted from medical document and generate a comprehensive report in **Markdown2** format. Ensure that every detail provided in the document is included, and do not omit or modify any information. Your output must strictly follow the required format.
+## Report Structure
+The report should be structured as follows, with each section containing only relevant information from the document:
+```markdown
+## Patient Information
+- Name: [Patient Name]
+- Age: [Patient Age]
+- Date of Scan: [Date]
+- Indication: [Reason for the CT scan]
+## Findings
+**Primary findings**:
+[Describe significant abnormalities or findings relevant to the indication]
+** Secondary findings**:
+[List incidental findings, e.g., "Mild hepatic steatosis noted."]
+**No abnormalities**:
+[Mention organs or systems without abnormalities, e.g., "No evidence of lymphadenopathy or pleural effusion."]
+## Impression
+[Summarize the findings concisely, e.g., "Findings suggest a primary lung tumor. Biopsy recommended for further evaluation."]
+## Recommendations
+[Include next steps or further tests, e.g., "PET scan and consultation with oncology recommended."]
+```
+[INST]
+## Instructions
+- **Do not invent or infer any information.** Only use data provided in the user request.
+- Ensure that the format is followed strictly, and the output is complete without any deviations.
+[/INST]"""

ocr/api/message/utils.py CHANGED Viewed

@@ -1,7 +1,8 @@
-import base64
 import io
 import re
 from pdf2image import convert_from_bytes
@@ -16,21 +17,15 @@ def divide_images(contents: bytes) -> list[bytes]:
     return image_bytes_list
-def prepare_request_content(images: list[bytes]):
-    content = [
-        {"type": "text", "text": "Generate a report on the attached document"},
-        *[
-            {
-                "type": "image_url",
-                "image_url": {
-                    "url": f"data:image/jpeg;base64,{base64.b64encode(image).decode('utf-8')}",
-                },
-            }
-            for image in images
-        ]
-    ]
-    return content
 def clean_response(text: str) -> str:
     try:

 import io
 import re
+import pytesseract
+from PIL import Image
 from pdf2image import convert_from_bytes
     return image_bytes_list
+def extract_text_from_images(images: list[bytes]) -> str:
+    extracted_texts = []
+    for image_bytes in images:
+        image = Image.open(io.BytesIO(image_bytes))
+        text = pytesseract.image_to_string(image)
+        extracted_texts.append(text)
+    return '\n'.join(extracted_texts)
 def clean_response(text: str) -> str:
     try:

ocr/api/message/views.py CHANGED Viewed

@@ -1,8 +1,9 @@
 from fastapi import File, UploadFile
 from ocr.api.message import ocr_router
 from ocr.api.message.schemas import OcrResponse
-from ocr.api.message.utils import divide_images, prepare_request_content, clean_response
 from ocr.core.wrappers import OcrResponseWrapper
@@ -12,6 +13,9 @@ async def get_all_chat_messages(
 ) -> OcrResponseWrapper[OcrResponse]:
     try:
         contents = await file.read()
-        return OcrResponseWrapper(data=OcrResponse(text=clean_response("## Coming soon")))
     finally:
         await file.close()

 from fastapi import File, UploadFile
 from ocr.api.message import ocr_router
+from ocr.api.message.openai_request import generate_report
 from ocr.api.message.schemas import OcrResponse
+from ocr.api.message.utils import divide_images, clean_response, extract_text_from_images
 from ocr.core.wrappers import OcrResponseWrapper
 ) -> OcrResponseWrapper[OcrResponse]:
     try:
         contents = await file.read()
+        images = divide_images(contents)
+        text_content = extract_text_from_images(images)
+        response = await generate_report(text_content)
+        return OcrResponseWrapper(data=OcrResponse(text=clean_response(response)))
     finally:
         await file.close()

ocr/core/wrappers.py CHANGED Viewed

@@ -1,10 +1,14 @@
 from functools import wraps
 from typing import Generic, Optional, TypeVar
 from fastapi import HTTPException
 from pydantic import BaseModel
 from starlette.responses import JSONResponse
 T = TypeVar('T')
@@ -42,6 +46,32 @@ def exception_wrapper(http_error: int, error_message: str):
     return decorator
 def background_task():
     def decorator(func):
         @wraps(func)

+import json
 from functools import wraps
 from typing import Generic, Optional, TypeVar
+import pydash
 from fastapi import HTTPException
 from pydantic import BaseModel
 from starlette.responses import JSONResponse
+from ocr.core.config import settings
 T = TypeVar('T')
     return decorator
+def openai_wrapper(
+        temperature: int | float = 0, model: str = "gpt-4o-mini", is_json: bool = False, return_: str = None
+):
+    def decorator(func):
+        @wraps(func)
+        async def wrapper(*args, **kwargs) -> str:
+            messages = await func(*args, **kwargs)
+            completion = await settings.OPENAI_CLIENT.chat.completions.create(
+                messages=messages,
+                temperature=temperature,
+                n=1,
+                model=model,
+                response_format={"type": "json_object"} if is_json else {"type": "text"}
+            )
+            response = completion.choices[0].message.content
+            if is_json:
+                response = json.loads(response)
+                if return_:
+                    return pydash.get(response, return_)
+            return response
+        return wrapper
+    return decorator
 def background_task():
     def decorator(func):
         @wraps(func)

requirements.txt CHANGED Viewed

@@ -11,11 +11,13 @@ httpx==0.28.1
 idna==3.10
 jiter==0.8.2
 openai==1.59.9
 pdf2image==1.17.0
 pillow==11.1.0
 pydantic==2.10.5
 pydantic_core==2.27.2
 pydash==8.0.5
 python-dotenv==1.0.1
 python-multipart==0.0.20
 PyYAML==6.0.2

 idna==3.10
 jiter==0.8.2
 openai==1.59.9
+packaging==24.2
 pdf2image==1.17.0
 pillow==11.1.0
 pydantic==2.10.5
 pydantic_core==2.27.2
 pydash==8.0.5
+pytesseract==0.3.13
 python-dotenv==1.0.1
 python-multipart==0.0.20
 PyYAML==6.0.2