Spaces:

Chamin09
/

BrailleMenuGen

Runtime error

App Files Files Community

BrailleMenuGen / app_bk2.py

Chamin09

Upload 17 files

87d0988 verified 4 months ago

raw

history blame contribute delete

3.86 kB

	import streamlit as st
	from PIL import Image
	import io
	import numpy as np

	# Import our custom modules
	from utils.image_preprocessing import preprocess_image
	from models.document_ai import extract_text_and_layout
	from models.text_processor import process_menu_text

	# App title and description
	st.title("Menu to Braille Converter")
	st.write("Upload a menu image to convert it to Braille text")

	# Sidebar for model settings
	st.sidebar.header("Settings")
	use_llm = st.sidebar.checkbox("Use LLM for text processing", value=True)

	# Add information about the application
	st.sidebar.markdown("---")
	st.sidebar.subheader("About")
	st.sidebar.info(
	"This application converts menu images to Braille text using AI. "
	"It extracts text from images using document AI, processes the text with LLMs, "
	"and will convert to Braille in future versions."
	)

	# File uploader
	uploaded_file = st.file_uploader("Choose a menu image...", type=["jpg", "jpeg", "png"])

	# Display uploaded image and process it
	if uploaded_file is not None:
	# Load and display image
	image = Image.open(uploaded_file)
	st.image(image, caption="Uploaded Menu", use_column_width=True)

	# Add a button to process the image
	if st.button("Process Menu"):
	with st.spinner("Processing image..."):
	# Preprocess the image
	preprocessed_img = preprocess_image(image)

	# Extract text using LayoutLMv2
	try:
	result = extract_text_and_layout(preprocessed_img)

	# Display extracted words
	if result['words']:
	raw_text = ' '.join(result['words'])

	# Show raw text in an expandable section
	with st.expander("Raw Extracted Text"):
	st.text_area("Raw OCR Output", raw_text, height=150)

	# Process text with LLM if enabled
	if use_llm:
	st.subheader("Processed Menu Text")
	with st.spinner("Enhancing text with AI..."):
	processed_result = process_menu_text(raw_text)

	if processed_result['success']:
	st.text_area("Structured Menu Text",
	processed_result['structured_text'],
	height=300)

	# Store the processed result for later use
	st.session_state.processed_text = processed_result['structured_text']
	st.session_state.menu_data = processed_result.get('menu_data', {})
	else:
	st.warning(f"AI processing failed: {processed_result.get('error', 'Unknown error')}")
	st.text_area("Text Output", raw_text, height=300)
	st.session_state.processed_text = raw_text
	else:
	# Just use the raw text
	st.subheader("Extracted Text")
	st.text_area("Text Output", raw_text, height=300)
	st.session_state.processed_text = raw_text
	else:
	st.warning("No text was extracted from the image.")

	except Exception as e:
	st.error(f"Error processing image: {str(e)}")

	# Placeholders for future functionality
	st.subheader("Braille Translation")
	st.info("Braille translation will be implemented in Phase 4")

	st.subheader("Download Options")
	st.info("PDF download will be implemented in Phase 5")