Spaces:

videopix
/

image2caption

Sleeping

App Files Files Community

videopix committed on Dec 2, 2025

Commit

eb023cc

verified ·

1 Parent(s): 256d97e

Update app.py

Browse files

Files changed (1) hide show

app.py +43 -26

app.py CHANGED Viewed

@@ -1,13 +1,11 @@
 import io
 import asyncio
-import threading
-import time
-from fastapi import FastAPI, File, UploadFile
 from fastapi.responses import JSONResponse, HTMLResponse
 from PIL import Image
 import torch
 from transformers import AutoProcessor, AutoModelForCausalLM
-import requests
 # ---------------------------------------------------
 # FastAPI App
@@ -16,14 +14,31 @@ app = FastAPI(title="Florence Image Caption API")
 device = "cuda" if torch.cuda.is_available() else "cpu"
-# Lazy load model on first request (prevents HF timeout)
 processor = None
 model = None
 model_lock = asyncio.Lock()
 async def load_model():
-    """Load Florence model only when first needed."""
     global processor, model
     if model is None:
@@ -38,7 +53,6 @@ async def load_model():
 def run_caption(image: Image.Image) -> str:
-    """Perform caption generation."""
     inputs = processor(
         text="<MORE_DETAILED_CAPTION>",
         images=image,
@@ -67,17 +81,17 @@ def run_caption(image: Image.Image) -> str:
 # API Endpoint
 # ---------------------------------------------------
 @app.post("/img2caption")
-async def img2caption(file: UploadFile = File(...)):
     try:
-        # Ensure model is loaded
         async with model_lock:
             await load_model()
-        # Read and convert image
         data = await file.read()
         image = Image.open(io.BytesIO(data)).convert("RGB")
-        # Caption
         caption = run_caption(image)
         return {"caption": caption}
@@ -87,10 +101,10 @@ async def img2caption(file: UploadFile = File(...)):
 # ---------------------------------------------------
-# Simple HTML UI
 # ---------------------------------------------------
 @app.get("/", response_class=HTMLResponse)
-def ui():
     return """
 <!DOCTYPE html>
 <html>
@@ -99,19 +113,11 @@ def ui():
     <style>
         body { font-family: Arial; max-width: 650px; margin: 40px auto; }
         h2 { text-align: center; }
-        #preview {
-            width: 100%; margin-top: 15px; display: none;
-            border-radius: 8px;
-        }
-        #captionBox {
-            margin-top: 20px; padding: 15px;
-            background: #eee; border-radius: 6px; display: none;
-        }
-        button {
-            padding: 12px; width: 100%; margin-top: 10px;
-            background: #4A90E2; color: white; border: none;
-            border-radius: 6px; cursor: pointer; font-size: 16px;
-        }
         button:hover { background: #357ABD; }
     </style>
 </head>
@@ -127,6 +133,13 @@ def ui():
     <div id="captionBox"></div>
 <script>
     const imageInput = document.getElementById("imageInput");
     const preview = document.getElementById("preview");
     const captionBox = document.getElementById("captionBox");
@@ -154,6 +167,7 @@ def ui():
         const res = await fetch("/img2caption", {
             method: "POST",
             body: form
         });
@@ -167,6 +181,9 @@ def ui():
 """
 def keep_alive():
     pass

 import io
 import asyncio
+import os
+from fastapi import FastAPI, File, UploadFile, Depends, Header, HTTPException
 from fastapi.responses import JSONResponse, HTMLResponse
 from PIL import Image
 import torch
 from transformers import AutoProcessor, AutoModelForCausalLM
 # ---------------------------------------------------
 # FastAPI App
 device = "cuda" if torch.cuda.is_available() else "cpu"
+# Lazy-loaded model and processor
 processor = None
 model = None
 model_lock = asyncio.Lock()
+# ---------------------------------------------------
+# Token Authentication
+# ---------------------------------------------------
+API_TOKEN = os.getenv("img2caption")   # your secret token from variables
async def verify_token(authorization: str = Header(None)):
    """Reject the request unless it carries the configured bearer token.

    Used as a FastAPI dependency (``Depends(verify_token)``) on protected
    routes. Returns ``None`` on success.

    Args:
        authorization: Raw value of the ``Authorization`` request header, or
            ``None`` when the header is absent.

    Raises:
        HTTPException: 401 when the header is missing or does not start with
            ``"Bearer "``; 403 when the presented token does not match
            ``API_TOKEN`` or when ``API_TOKEN`` is unset/empty.
    """
    # Function-scope import so the block does not depend on a file-level
    # import being added elsewhere.
    import secrets

    scheme = "Bearer "
    if authorization is None or not authorization.startswith(scheme):
        raise HTTPException(status_code=401, detail="Missing Authorization header")

    # Strip only the leading scheme; splitting on "Bearer " would take the
    # text after the *last* occurrence if the value contained it again.
    token = authorization[len(scheme):].strip()

    # Fail closed when no secret is configured: an unset or empty API_TOKEN
    # must never authenticate anyone (and compare_digest cannot take None).
    if not API_TOKEN:
        raise HTTPException(status_code=403, detail="Invalid token")

    # Constant-time comparison avoids leaking how much of the token matched.
    # Bytes are compared because compare_digest rejects non-ASCII str input.
    if not secrets.compare_digest(token.encode("utf-8"), API_TOKEN.encode("utf-8")):
        raise HTTPException(status_code=403, detail="Invalid token")
+# ---------------------------------------------------
+# Lazy Florence Model Load
+# ---------------------------------------------------
 async def load_model():
     global processor, model
     if model is None:
 def run_caption(image: Image.Image) -> str:
     inputs = processor(
         text="<MORE_DETAILED_CAPTION>",
         images=image,
 # API Endpoint
 # ---------------------------------------------------
 @app.post("/img2caption")
+async def img2caption(
+    file: UploadFile = File(...),
+    _: None = Depends(verify_token)
+):
     try:
         async with model_lock:
             await load_model()
         data = await file.read()
         image = Image.open(io.BytesIO(data)).convert("RGB")
         caption = run_caption(image)
         return {"caption": caption}
 # ---------------------------------------------------
+# Protected HTML UI
 # ---------------------------------------------------
 @app.get("/", response_class=HTMLResponse)
+async def ui(_: None = Depends(verify_token)):
     return """
 <!DOCTYPE html>
 <html>
     <style>
         body { font-family: Arial; max-width: 650px; margin: 40px auto; }
         h2 { text-align: center; }
+        #preview { width: 100%; margin-top: 15px; display: none; border-radius: 8px; }
+        #captionBox { margin-top: 20px; padding: 15px; background: #eee; border-radius: 6px; display: none; }
+        button { padding: 12px; width: 100%; margin-top: 10px;
+                 background: #4A90E2; color: white; border: none;
+                 border-radius: 6px; cursor: pointer; font-size: 16px; }
         button:hover { background: #357ABD; }
     </style>
 </head>
     <div id="captionBox"></div>
 <script>
+    let token = sessionStorage.getItem("authToken");
+    if (!token) {
+        token = prompt("Enter access token:");
+        sessionStorage.setItem("authToken", token);
+    }
     const imageInput = document.getElementById("imageInput");
     const preview = document.getElementById("preview");
     const captionBox = document.getElementById("captionBox");
         const res = await fetch("/img2caption", {
             method: "POST",
+            headers: { "Authorization": "Bearer " + token },
             body: form
         });
 """
+# ---------------------------------------------------
+# Run locally
+# ---------------------------------------------------
 def keep_alive():
     pass