linhaotong committed
Commit ace4129 · 1 Parent(s): e59f7b7
app.py CHANGED
@@ -68,9 +68,10 @@ if __name__ == "__main__":
     print(f"📁 Workspace Directory: {workspace_dir}")
     print(f"🖼️ Gallery Directory: {gallery_dir}")
 
+    # Launch with minimal, Spaces-compatible configuration
+    # Some parameters may cause routing issues, so we use minimal config
     app.launch(
         host="0.0.0.0",  # Required for Spaces
         port=7860,  # Standard Gradio port
-        share=False,  # Not needed on Spaces
-        debug=False
+        share=False  # Not needed on Spaces
     )
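Note that Gradio's own launch() takes server_name/server_port rather than host/port, so app here is presumably the DepthAnything3App wrapper changed in the next hunk, which does that mapping before calling demo.launch(). A minimal sketch of the call site under that assumption (the import path, constructor, and directory setup are guesses not shown in this commit):

# Hypothetical call site; only the launch() arguments come from the hunk above.
from depth_anything_3.app.gradio_app import DepthAnything3App

if __name__ == "__main__":
    app = DepthAnything3App()
    app.launch(
        host="0.0.0.0",  # Required for Spaces
        port=7860,       # Standard Gradio port
        share=False,     # Forwarded via **kwargs to demo.launch()
    )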
depth_anything_3/app/gradio_app.py CHANGED
@@ -619,8 +619,14 @@ class DepthAnything3App:
             **kwargs: Additional arguments for demo.launch()
         """
         demo = self.create_app()
+        # Configure launch settings for Spaces compatibility
+        # Use minimal config to avoid routing issues
         demo.queue(max_size=20).launch(
-            show_error=True, ssr_mode=False, server_name=host, server_port=port, **kwargs
+            show_error=True,
+            ssr_mode=False,
+            server_name=host,
+            server_port=port,
+            **kwargs
         )
 
 
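The hunk only shows the tail of the method; a minimal sketch of the enclosing launch(), assuming host and port are plain parameters with Spaces-friendly defaults (everything except the docstring tail and the queue().launch() call is a reconstruction):

# Hypothetical reconstruction of the enclosing method.
def launch(self, host: str = "0.0.0.0", port: int = 7860, **kwargs):
    """Launch the Gradio demo.

    Args:
        host: Interface to bind, passed as Gradio's server_name
        port: Port to serve on, passed as Gradio's server_port
        **kwargs: Additional arguments for demo.launch()
    """
    demo = self.create_app()
    # Configure launch settings for Spaces compatibility
    demo.queue(max_size=20).launch(
        show_error=True,
        ssr_mode=False,
        server_name=host,
        server_port=port,
        **kwargs,
    )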
 
depth_anything_3/app/modules/model_inference.py CHANGED
@@ -54,32 +54,42 @@ class ModelInference:
         """
         Initialize the DepthAnything3 model using global cache.
 
+        Optimization: Load model to CPU first, then move to GPU when needed.
+        This is faster than reloading from disk each time.
+
         This uses a global variable which is safe because @spaces.GPU
         runs in isolated subprocesses, each with its own global namespace.
 
         Args:
-            device: Device to load the model on
+            device: Device to run inference on (will move model to this device)
 
         Returns:
-            Model instance ready for inference
+            Model instance ready for inference on specified device
         """
         global _MODEL_CACHE
 
         if _MODEL_CACHE is None:
             # First time loading in this subprocess
+            # Load to CPU first (faster than loading directly to GPU)
             model_dir = os.environ.get(
                 "DA3_MODEL_DIR", "depth-anything/DA3NESTED-GIANT-LARGE"
             )
-            print(f"🔄 Loading model from {model_dir}...")
+            print(f"🔄 Loading model from {model_dir} to CPU...")
+            print("   (Model files are cached on disk)")
             _MODEL_CACHE = DepthAnything3.from_pretrained(model_dir)
+            # Load to CPU first (faster, and allows reuse)
+            _MODEL_CACHE = _MODEL_CACHE.to("cpu")
             _MODEL_CACHE.eval()
-            print("✅ Model loaded and ready on GPU")
-        else:
-            # Model already cached in this subprocess
-            print("✅ Using cached model")
-            # Ensure it's on the correct device
+            print("✅ Model loaded to CPU memory (cached in subprocess)")
+
+        # Move to target device for inference
+        if device != "cpu" and next(_MODEL_CACHE.parameters()).device.type != device:
+            print(f"🚀 Moving model from {next(_MODEL_CACHE.parameters()).device} to {device}...")
             _MODEL_CACHE = _MODEL_CACHE.to(device)
+            print(f"✅ Model ready on {device}")
+        elif device == "cpu":
+            # Already on CPU or requested CPU
+            pass
 
         return _MODEL_CACHE
 
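The CPU-first cache matters because @spaces.GPU re-enters a GPU-attached subprocess on each call: the first call in a subprocess pays the disk load, and later calls only pay the CPU-to-CUDA transfer. A minimal sketch of the calling pattern, assuming the code above lives in a module-level _initialize_model helper (the function name run_inference and the model's inference API are assumptions, not from this commit):

import spaces  # Hugging Face Spaces ZeroGPU decorator
import torch

@spaces.GPU  # body runs in a GPU-attached subprocess
def run_inference(images):
    # First call in this subprocess loads from disk to CPU;
    # subsequent calls reuse _MODEL_CACHE and only move it to CUDA.
    model = _initialize_model(device="cuda")  # hypothetical helper name
    with torch.no_grad():
        return model.inference(images)  # hypothetical inference API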