Spaces:

IrisDeng
/

UST_Deep_learning_asm1

Running

App Files Community

IrisDeng committed 1 day ago

Commit

1e8859c

verified ·

1 Parent(s): 9e09636

Update app.py

Browse files

Files changed (1) hide show

app.py +4 -9

app.py CHANGED Viewed

@@ -6,7 +6,6 @@ import torch
 st.set_page_config(page_title="Image-to-Audio Story Generator", page_icon="🦜")
 def create_image_caption(image_file):
     pil_image = Image.open(image_file)
     caption_generator = pipeline(
@@ -17,7 +16,7 @@ def create_image_caption(image_file):
     generated_caption = caption_result[0]["generated_text"]
     return generated_caption
-def build_children_story(image_description):
     story_generator = pipeline(
         "text-generation",
         model="Qwen/Qwen2.5-0.5B-Instruct",
@@ -28,10 +27,10 @@ def build_children_story(image_description):
         "Using the details derived from the image below, craft a complete and captivating tale that includes three main characters, "
         "an adventurous journey, and delightful surprises. "
         "Your story should have a clear beginning, middle, and end, and be between 80 and 100 words in length.\n\n"
-        f"Image Details: {caption_result}\n\nStory:"
     )
-    generated_output = story_pipeline(
         story_prompt,
         max_new_tokens=150,
         num_return_sequences=1,
@@ -63,13 +62,11 @@ def build_children_story(image_description):
     return story_text
 def convert_text_to_audio(story_content, audio_file_name="output.mp3"):
     """Turn the story text into English speech and save it to disk.

     Args:
         story_content: Text handed to gTTS as the speech source.
         audio_file_name: Path the synthesized audio is saved to.

     Returns:
         The same ``audio_file_name`` that was passed in, after saving.
     """
     # Build the gTTS request and write it out in a single chained call.
     gTTS(text=story_content, lang="en").save(audio_file_name)
     return audio_file_name
 def main_app():
     st.markdown("<h1 style='text-align: center;'>Image-to-Audio Story Generator 🦜</h1>", unsafe_allow_html=True)
     st.write("Upload an image below to generate an engaging story from the picture, then convert the story into audio playback!")
@@ -93,6 +90,4 @@ def main_app():
             audio_file_name = convert_text_to_audio(story_content)
         st.audio(audio_file_name, format="audio/mp3")
-if __name__ == "__main__":
-    main_app()

 st.set_page_config(page_title="Image-to-Audio Story Generator", page_icon="🦜")
 def create_image_caption(image_file):
     pil_image = Image.open(image_file)
     caption_generator = pipeline(
     generated_caption = caption_result[0]["generated_text"]
     return generated_caption
+def build_children_story(image_caption):  # Updated parameter name
     story_generator = pipeline(
         "text-generation",
         model="Qwen/Qwen2.5-0.5B-Instruct",
         "Using the details derived from the image below, craft a complete and captivating tale that includes three main characters, "
         "an adventurous journey, and delightful surprises. "
         "Your story should have a clear beginning, middle, and end, and be between 80 and 100 words in length.\n\n"
+        f"Image Details: {image_caption}\n\nStory:"
     )
+    generated_output = story_generator(
         story_prompt,
         max_new_tokens=150,
         num_return_sequences=1,
     return story_text
 def convert_text_to_audio(story_content, audio_file_name="output.mp3"):
     """Turn the story text into English speech and save it to disk.

     Args:
         story_content: Text handed to gTTS as the speech source.
         audio_file_name: Path the synthesized audio is saved to.

     Returns:
         The same ``audio_file_name`` that was passed in, after saving.
     """
     # Build the gTTS request and write it out in a single chained call.
     gTTS(text=story_content, lang="en").save(audio_file_name)
     return audio_file_name
 def main_app():
     st.markdown("<h1 style='text-align: center;'>Image-to-Audio Story Generator 🦜</h1>", unsafe_allow_html=True)
     st.write("Upload an image below to generate an engaging story from the picture, then convert the story into audio playback!")
             audio_file_name = convert_text_to_audio(story_content)
         st.audio(audio_file_name, format="audio/mp3")
+if __name__ == "__main