Spaces:

miltonc
/

5240_assignment1

Sleeping

App Files Files Community

miltonc committed on Mar 1, 2025

Commit

885aabb

1 Parent(s): 5cd11e3

first commit

Browse files

Files changed (2) hide show

app.py +59 -0
requirements.txt +5 -0

app.py ADDED Viewed

	@@ -0,0 +1,59 @@

+import streamlit as st
+from transformers import pipeline
+from gtts import gTTS
+import os
+from PIL import Image
+# Load models
+def load_models():
+    image_to_text = pipeline("image-to-text", model="Salesforce/blip-image-captioning-base")
+    summarizer = pipeline("summarization", model="facebook/bart-large-cnn")
+    return image_to_text, summarizer
+# Process image to text
+def generate_caption(image, image_to_text):
+    result = image_to_text(image)
+    return result[0]["generated_text"] if result else "No caption generated."
+# Summarize text
+def summarize_text(text, summarizer):
+    summary = summarizer(text, max_length=30, min_length=10, do_sample=False)
+    return summary[0]["summary_text"] if summary else "No summary generated."
+# Convert text to speech
+def text_to_speech(text, filename="output.mp3"):
+    tts = gTTS(text)
+    tts.save(filename)
+    return filename
+# Main Streamlit app
+def main():
+    st.title("AI-Powered Image Captioning, Summarization, and Speech")
+    image_to_text, summarizer = load_models()
+    uploaded_file = st.file_uploader("Upload an image...", type=["jpg", "png", "jpeg"])
+    if uploaded_file is not None:
+        # Convert uploaded file to a PIL image
+        image = Image.open(uploaded_file)
+        # Display the uploaded image
+        st.image(image, caption="Uploaded Image", use_column_width=True)
+        with st.spinner("Generating caption..."):
+            caption = generate_caption(image, image_to_text)
+            st.write("### Image Caption:")
+            st.write(caption)
+        with st.spinner("Summarizing caption..."):
+            summary = summarize_text(caption, summarizer)
+            st.write("### Summary:")
+            st.write(summary)
+        with st.spinner("Generating speech..."):
+            audio_file = text_to_speech(summary)
+            st.audio(audio_file, format="audio/mp3")
+# Call main() only when this file is executed as the __main__ module.
+if __name__ == "__main__":
+    main()

requirements.txt ADDED Viewed

	@@ -0,0 +1,5 @@

+streamlit
+transformers
+torch
+Pillow
+gtts