Spaces:
Sleeping
Sleeping
Optimize batch sizes for H100 ZeroGPU and reduce Optimus duration
- Reduce Optimus GPU duration from 600s to 300s to fit ZeroGPU limits
- Increase batch_size to 128 on ZeroGPU (H100) for better throughput
- Apply batch_size optimization to both CTransPath and Optimus
- Keep batch_size=64 for non-ZeroGPU environments
- Estimated throughput: 12,000-15,000 tiles in 300s with H-optimus-0
- src/mosaic/analysis.py +11 -5
src/mosaic/analysis.py
CHANGED
|
@@ -59,8 +59,11 @@ def _extract_ctranspath_features(coords, slide_path, attrs, num_workers):
     num_workers = max(num_workers, 8)
     logger.info(f"Running CTransPath with num_workers={num_workers}")
 
+    # Use larger batch size on H100 for better throughput
+    batch_size = 128 if IS_ZEROGPU else 64
+
     start_time = pd.Timestamp.now()
-    logger.info("Extracting CTransPath features")
+    logger.info(f"Extracting CTransPath features with batch_size={batch_size}")
     ctranspath_features, _ = get_features(
         coords,
         slide_path,
@@ -68,7 +71,7 @@ def _extract_ctranspath_features(coords, slide_path, attrs, num_workers):
         model_type=ModelType.CTRANSPATH,
         model_path="data/ctranspath.pth",
         num_workers=num_workers,
-        batch_size=64,
+        batch_size=batch_size,
         use_gpu=True,
     )
     end_time = pd.Timestamp.now()
@@ -85,7 +88,7 @@ def _extract_ctranspath_features(coords, slide_path, attrs, num_workers):
     return ctranspath_features, coords
 
 
-@spaces.GPU(duration=600)
+@spaces.GPU(duration=300)
 def _extract_optimus_features(filtered_coords, slide_path, attrs, num_workers):
     """Extract Optimus features on GPU.
 
@@ -105,8 +108,11 @@ def _extract_optimus_features(filtered_coords, slide_path, attrs, num_workers):
     num_workers = max(num_workers, 8)
     logger.info(f"Running Optimus with num_workers={num_workers}")
 
+    # Use larger batch size on H100 for better throughput
+    batch_size = 128 if IS_ZEROGPU else 64
+
    start_time = pd.Timestamp.now()
-    logger.info("Extracting Optimus features")
+    logger.info(f"Extracting Optimus features with batch_size={batch_size}")
     features, _ = get_features(
         filtered_coords,
         slide_path,
@@ -114,7 +120,7 @@ def _extract_optimus_features(filtered_coords, slide_path, attrs, num_workers):
         model_type=ModelType.OPTIMUS,
         model_path="data/optimus.pkl",
         num_workers=num_workers,
-        batch_size=64,
+        batch_size=batch_size,
         use_gpu=True,
     )
     end_time = pd.Timestamp.now()