Spaces:

Shreyansh234
/

Practice_Space

Sleeping

Shreyansh234 committed on Sep 1, 2025

Commit

2d80e92

verified ·

1 Parent(s): bf8eb74

Update src/streamlit_app.py

Files changed (1) hide show

src/streamlit_app.py CHANGED Viewed

@@ -1,16 +1,29 @@
 import streamlit as st
 from PIL import Image
 from transformers import BlipProcessor, BlipForConditionalGeneration
-# Load model + processor (BLIP for image captioning)
 @st.cache_resource
 def load_model():
-    processor = BlipProcessor.from_pretrained("Salesforce/blip-image-captioning-base")
-    model = BlipForConditionalGeneration.from_pretrained("Salesforce/blip-image-captioning-base")
     return processor, model
 processor, model = load_model()
 st.title("🖼️ Image to Text (Caption Generator)")
 st.write("Upload an image and get a text caption generated by a Transformer model 🚀")
@@ -21,10 +34,11 @@ if uploaded_file is not None:
     image = Image.open(uploaded_file).convert("RGB")
     st.image(image, caption="Uploaded Image", use_column_width=True)
-    if st.button("Generate Caption"):
-        inputs = processor(image, return_tensors="pt")
-        out = model.generate(**inputs, max_new_tokens=30)
-        caption = processor.decode(out[0], skip_special_tokens=True)
         st.subheader("📝 Generated Caption:")
         st.success(caption)

+import os
 import streamlit as st
 from PIL import Image
 from transformers import BlipProcessor, BlipForConditionalGeneration
+# ✅ Fix cache issue: force Hugging Face to use /tmp for model storage
+os.environ["HF_HOME"] = "/tmp"
+os.environ["TRANSFORMERS_CACHE"] = "/tmp"
+# Load BLIP model + processor (cached in /tmp)
 @st.cache_resource
 def load_model():
+    processor = BlipProcessor.from_pretrained(
+        "Salesforce/blip-image-captioning-base",
+        cache_dir="/tmp"
+    )
+    model = BlipForConditionalGeneration.from_pretrained(
+        "Salesforce/blip-image-captioning-base",
+        cache_dir="/tmp"
+    )
     return processor, model
 processor, model = load_model()
+# Streamlit UI
+st.set_page_config(page_title="Image → Text Captioning", page_icon="🖼️")
 st.title("🖼️ Image to Text (Caption Generator)")
 st.write("Upload an image and get a text caption generated by a Transformer model 🚀")
     image = Image.open(uploaded_file).convert("RGB")
     st.image(image, caption="Uploaded Image", use_column_width=True)
+    if st.button("✨ Generate Caption"):
+        with st.spinner("Generating caption... please wait ⏳"):
+            inputs = processor(image, return_tensors="pt")
+            output_ids = model.generate(**inputs, max_new_tokens=30)
+            caption = processor.decode(output_ids[0], skip_special_tokens=True)
         st.subheader("📝 Generated Caption:")
         st.success(caption)