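# Spaces: Sleeping
# (The line above appears to be a hosting-page status banner captured along
# with this file; it is not part of the program.)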
# streamlit_ui.py
import base64
import os
import tempfile

import requests
import streamlit as st

from backend.subtitle_utils import generate_srt_from_text, enhance_video_with_subtitles_and_bgm
# Browser-tab and layout settings, applied before anything is drawn on the page.
_page_settings = {
    "page_title": "Prompta - Text to Media Generator",
    "page_icon": "ποΈ",
    "layout": "wide",
    "initial_sidebar_state": "expanded",
}
st.set_page_config(**_page_settings)

st.title("ποΈπΌοΈποΈ Prompta - Text to Media Generator")

# Root URL of the generation backend; every request below is built on top of it.
API_BASE = "http://localhost:8000"
def render_media(file_bytes: bytes, media_type: str, label: str) -> None:
    """Display a generated media payload on the Streamlit page.

    Args:
        file_bytes: Raw bytes of the media file to show.
        media_type: ``"audio"``, ``"video"`` or ``"image"``. Any other value
            renders nothing.
        label: Caption placed under an image; not used for audio or video.
    """
    if media_type == "image":
        # Images are handed to Streamlit as raw bytes, so no encoding is needed.
        st.image(file_bytes, caption=label, use_column_width=True)
        return

    if media_type not in ("audio", "video"):
        return

    # Audio and video are embedded as base64 data URIs; encode only on this
    # path so image (and unrecognised) payloads skip the extra copy.
    encoded = base64.b64encode(file_bytes).decode()
    if media_type == "audio":
        st.audio(f"data:audio/wav;base64,{encoded}", format="audio/wav")
    else:
        st.video(f"data:video/mp4;base64,{encoded}")
# Sidebar controls: API credentials and the task selector.
st.sidebar.header("π οΈ Settings")
TOKEN = st.sidebar.text_input("π API Token", type="password")

# An Authorization header is attached only when a token was entered;
# otherwise requests go out with no extra headers.
HEADERS = {}
if TOKEN:
    HEADERS["Authorization"] = f"Bearer {TOKEN}"

_task_names = ["Text to Audio", "Text to Image", "Text to Video"]
tab = st.sidebar.radio("Select Task", _task_names)
def _error_detail(response):
    """Return a readable failure reason for an unsuccessful backend response.

    Uses the JSON ``detail`` field when the body is a JSON object that has
    one; otherwise falls back to the raw body text, or to the HTTP status
    code when the body is empty. Never raises on a non-JSON body.
    """
    try:
        payload = response.json()
    except ValueError:
        # Body is not JSON (e.g. an HTML error page or an empty reply).
        payload = None
    if isinstance(payload, dict) and payload.get("detail"):
        return payload["detail"]
    return response.text or f"HTTP {response.status_code}"


def _request_media(endpoint, payload):
    """POST ``payload`` as JSON to ``API_BASE + endpoint``.

    Returns the raw response body on HTTP 200. On any other status, or when
    the request itself fails, shows an error on the page and returns ``None``.
    """
    try:
        response = requests.post(f"{API_BASE}{endpoint}", json=payload, headers=HEADERS)
    except requests.RequestException as exc:
        # Backend unreachable / connection dropped: report it instead of
        # letting the traceback take over the page.
        st.error(f"β Failed: {exc}")
        return None
    if response.status_code != 200:
        st.error(f"β Failed: {_error_detail(response)}")
        return None
    return response.content


def _enhance_video(video_bytes, transcript):
    """Add subtitles and background music to a video and return the new bytes.

    All intermediate files (input video, subtitle file, output video) live in
    a per-call temporary directory that is removed afterwards, so nothing is
    left behind and simultaneous sessions cannot overwrite each other's files.
    """
    with tempfile.TemporaryDirectory() as work_dir:
        source_path = os.path.join(work_dir, "input.mp4")
        with open(source_path, "wb") as source_file:
            source_file.write(video_bytes)

        srt_path = generate_srt_from_text(
            transcript,
            output_path=os.path.join(work_dir, "streamlit_subs.srt"),
        )
        enhanced_path = os.path.join(work_dir, "streamlit_final_video.mp4")
        enhance_video_with_subtitles_and_bgm(
            video_path=source_path,
            srt_path=srt_path,
            bgm_path="default_bgm.mp3",
            output_path=enhanced_path,
        )
        # Read the result before the directory is cleaned up.
        with open(enhanced_path, "rb") as enhanced_file:
            return enhanced_file.read()


if tab == "Text to Audio":
    st.subheader("π€ Text to Audio")
    text = st.text_area("Enter text")
    voice = st.selectbox("Choose voice/language", ["en-US", "hi-IN", "te-IN", "ta-IN"])
    if st.button("π Generate Audio"):
        with st.spinner("Generating audio..."):
            audio_bytes = _request_media("/audio/generate", {"text": text, "voice": voice})
        if audio_bytes is not None:
            render_media(audio_bytes, "audio", "Generated Audio")

elif tab == "Text to Image":
    st.subheader("πΌοΈ Text to Image")
    prompt = st.text_area("Enter image prompt")
    model = st.selectbox("Choose model", ["sdxl", "deepfloyd", "kandinsky"])
    if st.button("π§ Generate Image"):
        with st.spinner("Generating image..."):
            image_bytes = _request_media("/image/generate", {"prompt": prompt, "model": model})
        if image_bytes is not None:
            render_media(image_bytes, "image", "Generated Image")

elif tab == "Text to Video":
    st.subheader("ποΈ Text to Video")
    prompt = st.text_area("Enter video prompt")
    tone = st.selectbox("Tone", ["formal", "casual", "emotional", "documentary"])
    domain = st.selectbox("Domain", ["health", "education", "governance", "entertainment"])
    environment = st.selectbox("Environment", ["urban", "rural", "nature", "futuristic"])
    transcript = st.text_area("Transcript (optional - for subtitles)", height=100)
    enhance = st.checkbox("β¨ Add Subtitles and Background Music")
    if st.button("π¬ Generate Video"):
        video_label = "Generated Video"
        with st.spinner("Generating video..."):
            video_bytes = _request_media(
                "/video/generate",
                {"prompt": prompt, "tone": tone, "domain": domain, "environment": environment},
            )
            # Enhancement needs a transcript to build subtitles from; without
            # one the plain generated video is shown.
            if video_bytes is not None and enhance and transcript:
                video_bytes = _enhance_video(video_bytes, transcript)
                video_label = "Enhanced Video"
        if video_bytes is not None:
            render_media(video_bytes, "video", video_label)
# Sidebar footer: a horizontal rule followed by the attribution note.
_footer_note = "Built with β€οΈ for AI GovTech Challenge 2025"
st.sidebar.markdown("---")
st.sidebar.info(_footer_note)