Spaces:

hskwon7
/

ISOM5240-Individual-Assignment

Sleeping

App Files Files Community

hskwon7 committed on Apr 29, 2025

Commit

6c53b18

verified ·

1 Parent(s): 3ac5eff

Update app.py

Browse files

Files changed (1) hide show

app.py +28 -12

app.py CHANGED Viewed

@@ -3,8 +3,9 @@
 app.py
 Streamlit application for Image-to-Story demo.
-Allows users to upload an image, generates a caption, creates a child-friendly story,
 and plays it back as audio.
 """
 import streamlit as st
 from PIL import Image
@@ -25,7 +26,8 @@ warnings.filterwarnings("ignore", category=DeprecationWarning)
 def main():
     st.title("🖼️ → 📖 Image-to-Story App for Kids")
     st.write(
-        "Upload an image, get a caption, spin it into a story, and play it aloud!"
     )
     # Load pipelines (cached) with a friendly spinner
@@ -40,25 +42,37 @@ def main():
     story_gen = st.session_state.story_gen
     tts_pipe  = st.session_state.tts_pipe
-    # File uploader for images
-    uploaded = st.file_uploader(
-        "Upload an image (PNG, JPG, JPEG)", type=["png", "jpg", "jpeg"]
     )
-    if not uploaded:
-        return
-    # Display uploaded image
-    img = Image.open(uploaded)
     st.image(img, use_container_width=True)
     # Generate caption once
-    if "caption" not in st.session_state:
         with st.spinner("Generating image caption…"):
             st.session_state.caption = generate_caption(captioner, img)
     st.markdown(f"**Caption:** {st.session_state.caption}")
     # Generate story once
-    if "story" not in st.session_state:
         with st.spinner("Creating story for kids…"):
             st.session_state.story = generate_story(
                 story_gen,
@@ -66,14 +80,16 @@ def main():
                 min_words=50,
                 max_words=100
             )
     st.markdown(f"**Story:** {st.session_state.story}")
     # Generate TTS audio once
-    if "audio_data" not in st.session_state:
         with st.spinner("Synthesizing speech…"):
             audio_array, sr = generate_audio(tts_pipe, st.session_state.story)
             st.session_state.audio_data = audio_array
             st.session_state.audio_sr   = sr
     # Audio playback button
     if st.button("🔊 Play Story Audio"):

 app.py
 Streamlit application for Image-to-Story demo.
+Allows users to upload an image or use a demo image, generates a caption, creates a child-friendly story,
 and plays it back as audio.
+Suitable for deployment on Hugging Face Spaces.
 """
 import streamlit as st
 from PIL import Image
 def main():
     st.title("🖼️ → 📖 Image-to-Story App for Kids")
     st.write(
+        "Upload an image or use the demo image to get an engaging story suitable for 3–10 year-olds, "
+        "with audio playback powered by Hugging Face pipelines!"
     )
     # Load pipelines (cached) with a friendly spinner
     story_gen = st.session_state.story_gen
     tts_pipe  = st.session_state.tts_pipe
+    # Choose image source
+    source = st.radio(
+        "Choose image source:",
+        ("Upload my own image", "Use demo image")
     )
+    if source == "Use demo image":
+        # Load the bundled demo image
+        img = Image.open("test_kids_playing.jpg")
+    else:
+        uploaded = st.file_uploader(
+            "Upload an image (PNG, JPG, JPEG)",
+            type=["png", "jpg", "jpeg"],
+            key="upload"
+        )
+        if not uploaded:
+            return
+        img = Image.open(uploaded)
+    # Display image
     st.image(img, use_container_width=True)
     # Generate caption once
+    if "caption" not in st.session_state or source != st.session_state.get("last_source"):
         with st.spinner("Generating image caption…"):
             st.session_state.caption = generate_caption(captioner, img)
+            st.session_state.last_source = source
     st.markdown(f"**Caption:** {st.session_state.caption}")
     # Generate story once
+    if "story" not in st.session_state or source != st.session_state.get("last_source"):
         with st.spinner("Creating story for kids…"):
             st.session_state.story = generate_story(
                 story_gen,
                 min_words=50,
                 max_words=100
             )
+            st.session_state.last_source = source
     st.markdown(f"**Story:** {st.session_state.story}")
     # Generate TTS audio once
+    if "audio_data" not in st.session_state or source != st.session_state.get("last_source"):
         with st.spinner("Synthesizing speech…"):
             audio_array, sr = generate_audio(tts_pipe, st.session_state.story)
             st.session_state.audio_data = audio_array
             st.session_state.audio_sr   = sr
+            st.session_state.last_source = source
     # Audio playback button
     if st.button("🔊 Play Story Audio"):