Commit d49d935 · committed by Abid Ali Awan · Parent(s): 87b61df
Enhance app_savta.py with improved model loading and fallback depth estimation
- Added support for Hugging Face flagging with a dataset saver.
- Implemented a fallback depth estimation method that uses simple edge detection when the model file is not found (a standalone sketch of this heuristic follows the diff below).
- Updated the inference logic and Gradio UI to include flagging options and a footer with project links.
- Streamlined the model loading process with error handling for a better user experience.
Files changed: app/app_savta.py: +122 -10
```diff
@@ -1,34 +1,141 @@
+import os, sys, tempfile, subprocess
 from pathlib import Path
-
-import gradio as gr
+import torch
 from fastai.vision.all import *
+import gradio as gr
+
+#######################
+# Hugging Face flags #
+#######################
+
+HF_TOKEN = os.getenv("HF_TOKEN")
+
+try:
+    from gradio.flagging import HuggingFaceDatasetSaver  # type: ignore
+    hf_writer: gr.FlaggingCallback | None = HuggingFaceDatasetSaver(
+        repo_id="savtadepth-flags-V2", token=HF_TOKEN
+    )
+    allow_flagging: str | bool = "manual"
+except (ImportError, AttributeError):
+    hf_writer = None
+    allow_flagging = "never"
 
-#
+############
+# Model setup without DVC
+############
+
+# Use local model path
 MODEL_PATH = Path(__file__).parent.parent / "models" / "model.pth"
 
+# Check if model exists and use fastai approach from working version
 if not MODEL_PATH.exists():
-
+    print("❌ Model not found at", MODEL_PATH)
+    print("Using fallback depth estimation...")
+    # Fallback to simple image processing
+    class SimpleDepthEstimator:
+        def predict(self, input_img):
+            from PIL import Image
+            import numpy as np
+
+            # Convert to grayscale if needed
+            if input_img.mode != 'L':
+                img_gray = input_img.convert('L')
+            else:
+                img_gray = input_img
+
+            # Simple edge detection for depth
+            img_array = np.array(img_gray, dtype=np.float32)
+            grad_x = np.abs(np.diff(img_array, axis=1, prepend=img_array[:, :1]))
+            grad_y = np.abs(np.diff(img_array, axis=0, prepend=img_array[:1, :]))
+            edge_magnitude = np.sqrt(grad_x**2 + grad_y**2)
+
+            # Create depth based on edges and brightness
+            if edge_magnitude.max() > 0:
+                edge_magnitude = (edge_magnitude - edge_magnitude.min()) / (edge_magnitude.max() - edge_magnitude.min()) * 255
+
+            normalized_brightness = (img_array - img_array.min()) / (img_array.max() - img_array.min() + 1e-8)
+            depth_factor = 0.6 * (edge_magnitude / 255.0) + 0.4 * (1 - normalized_brightness)
+            depth_factor = np.clip(depth_factor, 0, 1)
+
+            # Convert back to PIL Image
+            depth_array = (depth_factor * 255).astype(np.uint8)
+            return Image.fromarray(depth_array, mode='L')
+
+    learner = SimpleDepthEstimator()
+else:
+    try:
+        # Use the working approach from the previous version
+        # Simple approach for inference only (without training data)
+        learn = load_learner(MODEL_PATH)
+        learner = learn
+    except Exception as e:
+        print(f"❌ Failed to load model: {e}")
+        print("Using fallback depth estimation...")
+
+        class SimpleDepthEstimator:
+            def predict(self, input_img):
+                from PIL import Image
+                import numpy as np
+
+                # Convert to grayscale if needed
+                if input_img.mode != 'L':
+                    img_gray = input_img.convert('L')
+                else:
+                    img_gray = input_img
+
+                # Simple edge detection for depth
+                img_array = np.array(img_gray, dtype=np.float32)
+                grad_x = np.abs(np.diff(img_array, axis=1, prepend=img_array[:, :1]))
+                grad_y = np.abs(np.diff(img_array, axis=0, prepend=img_array[:1, :]))
+                edge_magnitude = np.sqrt(grad_x**2 + grad_y**2)
+
+                # Create depth based on edges and brightness
+                if edge_magnitude.max() > 0:
+                    edge_magnitude = (edge_magnitude - edge_magnitude.min()) / (edge_magnitude.max() - edge_magnitude.min()) * 255
+
+                normalized_brightness = (img_array - img_array.min()) / (img_array.max() - img_array.min() + 1e-8)
+                depth_factor = 0.6 * (edge_magnitude / 255.0) + 0.4 * (1 - normalized_brightness)
+                depth_factor = np.clip(depth_factor, 0, 1)
+
+                # Convert back to PIL Image
+                depth_array = (depth_factor * 255).astype(np.uint8)
+                return Image.fromarray(depth_array, mode='L')
+
+        learner = SimpleDepthEstimator()
 
-learner = load_learner(MODEL_PATH)
 
+#####################
+# Inference Logic #
+#####################
 
-# Inference function
 def predict_depth(input_img: PILImage) -> PILImageBW:
     depth, *_ = learner.predict(input_img)
     return PILImageBW.create(depth).convert("L")
 
+#####################
+# Gradio UI #
+#####################
 
-# Gradio UI
 title = "📷 SavtaDepth WebApp"
 
-description_md = """
+description_md = (
+    """
 <p style="text-align:center;font-size:1.05rem;max-width:760px;margin:auto;">
 Upload an RGB image on the left and get a grayscale depth map on the right.
 </p>
 """
+)
 
-
-
+footer_html = (
+    """
+    <p style='text-align:center;font-size:0.9rem;'>
+    <a href='https://dagshub.com/OperationSavta/SavtaDepth' target='_blank'>Project on DAGsHub</a> •
+    <a href='https://colab.research.google.com/drive/1XU4DgQ217_hUMU1dllppeQNw3pTRlHy1?usp=sharing' target='_blank'>Google Colab Demo</a>
+    </p>
+    """
+)
+
+examples = [["examples/00008.jpg"], ["examples/00045.jpg"]]
 
 input_component = gr.Image(width=640, height=480, label="Input RGB")
 output_component = gr.Image(label="Predicted Depth", image_mode="L")
@@ -41,9 +148,14 @@ with gr.Blocks(title=title, theme=gr.themes.Soft()) as demo:
         fn=predict_depth,
         inputs=input_component,
         outputs=output_component,
+        allow_flagging=allow_flagging,
+        flagging_options=["incorrect", "worst", "ambiguous"],
+        flagging_callback=hf_writer,
         examples=examples,
        cache_examples=False,
     )
 
+    gr.HTML(footer_html)
+
 if __name__ == "__main__":
     demo.queue().launch()
```
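The fallback heuristic added in this commit is easy to exercise outside the app. One caveat worth noting: `predict_depth` unpacks the prediction (`depth, *_ = learner.predict(input_img)`), which matches fastai's tuple-returning `Learner.predict` but not the fallback `predict`, which returns a bare PIL image; the sketch below therefore tests the heuristic directly as a plain function. This is a minimal sketch assuming only NumPy and Pillow; the helper name `estimate_depth_fallback` and the synthetic test image are illustrative, not part of the app.

```python
# Minimal standalone sketch of the fallback depth heuristic, for quick local
# testing. Assumes only NumPy and Pillow; `estimate_depth_fallback` and the
# synthetic gradient image are illustrative, not part of the committed app.
import numpy as np
from PIL import Image


def estimate_depth_fallback(img: Image.Image) -> Image.Image:
    arr = np.array(img.convert("L"), dtype=np.float32)
    # Gradient magnitude as a crude edge map (same scheme as the app code)
    grad_x = np.abs(np.diff(arr, axis=1, prepend=arr[:, :1]))
    grad_y = np.abs(np.diff(arr, axis=0, prepend=arr[:1, :]))
    edges = np.sqrt(grad_x**2 + grad_y**2)
    if edges.max() > 0:
        edges = (edges - edges.min()) / (edges.max() - edges.min())
    # Blend edge strength with inverted brightness, weights as committed (0.6/0.4)
    brightness = (arr - arr.min()) / (arr.max() - arr.min() + 1e-8)
    depth = np.clip(0.6 * edges + 0.4 * (1.0 - brightness), 0.0, 1.0)
    return Image.fromarray((depth * 255).astype(np.uint8), mode="L")


# Smoke test on a 64x256 horizontal brightness ramp
ramp = Image.fromarray(np.tile(np.arange(256, dtype=np.uint8), (64, 1)))
depth_map = estimate_depth_fallback(ramp)
assert depth_map.size == ramp.size and depth_map.mode == "L"
```

As in the committed code, the 0.6/0.4 blend means strong edges and darker pixels both push the output value higher in the resulting depth map.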