Spaces:

mgokg
/

MultimodalLiveApi

Sleeping

mgokg committed on Mar 9

Commit

8ccf021

verified ·

1 Parent(s): 35d364a

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -9,6 +9,25 @@ def process_pdf(file):
     for page in pdf_reader.pages:
         text += page.extract_text()
     return text
 with gr.Blocks() as demo:
     gr.Markdown("### File upload", elem_classes="tab-header")
@@ -18,6 +37,6 @@ with gr.Blocks() as demo:
         file_input = gr.File(label="Wähle eine PDF-Datei aus", type="filepath")
     with gr.Row():
         submit_button = gr.Button("upload")
-    submit_button.click(process_pdf, inputs=file_input, outputs=text_output)
 demo.launch()

     for page in pdf_reader.pages:
         text += page.extract_text()
     return text
+def process_file(file):
+    file_extension = file.name.split(".")[-1].lower()
+    if file_extension == 'pdf':
+        ocr_text = process_pdf(file)
+        return ocr_text
+    elif file_extension == 'docx':
+        docx_document = DocxDocument(file.name)
+        text = ""
+        for paragraph in docx_document.paragraphs:
+            text += paragraph.text + "\n"
+        return text
+    #return [Document(text=text)]
 with gr.Blocks() as demo:
     gr.Markdown("### File upload", elem_classes="tab-header")
         file_input = gr.File(label="Wähle eine PDF-Datei aus", type="filepath")
     with gr.Row():
         submit_button = gr.Button("upload")
+    submit_button.click(process_file, inputs=file_input, outputs=text_output)
 demo.launch()