Spaces:

jiang-cc
/

AD-Copilot

Running on Zero

App Files Community

jiang-cc committed on Apr 9

Commit

c96fed6

verified ·

1 Parent(s): 9f4294d

fix: pass file paths instead of PIL objects to ZeroGPU worker to avoid serialization TypeError

Browse files

Files changed (1) hide show

app.py +17 -5

app.py CHANGED Viewed

@@ -3,6 +3,7 @@ AD-Copilot Demo: Comparison-Aware Anomaly Detection with Vision-Language Model
 """
 import os
 import traceback
 import spaces
 import gradio as gr
@@ -36,17 +37,18 @@ model = AutoModelForImageTextToText.from_pretrained(
 # ---------------------------------------------------------------------------
 @spaces.GPU(duration=120)
 def _predict_inner(
-    reference_image: Image.Image,
-    test_image: Image.Image,
     prompt: str,
     max_new_tokens: int,
 ):
     with torch.inference_mode():
         max_new_tokens = int(max_new_tokens)
         # Resize long edge to 512 to save GPU memory / speed up
-        reference_image = reference_image.copy()
-        test_image = test_image.copy()
         reference_image.thumbnail((512, 512), Image.Resampling.LANCZOS)
         test_image.thumbnail((512, 512), Image.Resampling.LANCZOS)
@@ -97,7 +99,17 @@ def predict(
     if reference_image is None or test_image is None:
         return "Please upload both a reference (good) image and a test image."
     try:
-        return _predict_inner(reference_image, test_image, prompt, max_new_tokens)
     except Exception as e:
         tb = traceback.format_exc()
         print(tb, flush=True)

 """
 import os
+import tempfile
 import traceback
 import spaces
 import gradio as gr
 # ---------------------------------------------------------------------------
 @spaces.GPU(duration=120)
 def _predict_inner(
+    ref_path: str,
+    test_path: str,
     prompt: str,
     max_new_tokens: int,
 ):
     with torch.inference_mode():
         max_new_tokens = int(max_new_tokens)
+        reference_image = Image.open(ref_path).convert("RGB")
+        test_image = Image.open(test_path).convert("RGB")
         # Resize long edge to 512 to save GPU memory / speed up
         reference_image.thumbnail((512, 512), Image.Resampling.LANCZOS)
         test_image.thumbnail((512, 512), Image.Resampling.LANCZOS)
     if reference_image is None or test_image is None:
         return "Please upload both a reference (good) image and a test image."
     try:
+        # Save PIL images to temp files to avoid serialization issues with ZeroGPU
+        with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as f:
+            reference_image.save(f, format="PNG")
+            ref_path = f.name
+        with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as f:
+            test_image.save(f, format="PNG")
+            test_path = f.name
+        result = _predict_inner(ref_path, test_path, prompt, max_new_tokens)
+        os.unlink(ref_path)
+        os.unlink(test_path)
+        return result
     except Exception as e:
         tb = traceback.format_exc()
         print(tb, flush=True)