Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -44,7 +44,7 @@ if submit:
|
|
44 |
import os
|
45 |
import re
|
46 |
import pdfminer
|
47 |
-
|
48 |
from transformers import pipeline
|
49 |
|
50 |
import streamlit as st
|
@@ -85,7 +85,7 @@ uploaded_file = st.file_uploader("Choose a PDF file")
|
|
85 |
if uploaded_file is not None:
|
86 |
with st.spinner("Processing..."):
|
87 |
text = ""
|
88 |
-
for page_layout in
|
89 |
for element in page_layout:
|
90 |
text += preprocess_text(element) + "\n"
|
91 |
if text:
|
|
|
44 |
import os
|
45 |
import re
|
46 |
import pdfminer
|
47 |
+
from pdfminer.high_level import extract_pages
|
48 |
from transformers import pipeline
|
49 |
|
50 |
import streamlit as st
|
|
|
85 |
if uploaded_file is not None:
|
86 |
with st.spinner("Processing..."):
|
87 |
text = ""
|
88 |
+
for page_layout in extract_pages(uploaded_file):
|
89 |
for element in page_layout:
|
90 |
text += preprocess_text(element) + "\n"
|
91 |
if text:
|