| # Train LiDAR-Perfect Depth on top of a pretrained PPD checkpoint. | |
| # | |
| # Stage 1 (image pretrain @512²): trains only the sparse-prompt encoder + gate | |
| # on Hypersim with simulated sparse-LiDAR; DiT backbone frozen. | |
| # Stage 2 (image finetune @1024×768): unfreezes the DiT (optional) and mixes | |
| # Hypersim + UrbanSyn + UnrealStereo4K + VKITTI2 + TartanAir. | |
| # Stage 3 (video finetune): adds the temporal Kalman filter loop on short clips. | |
| # | |
| # Pre-reqs: | |
| # * checkpoints/ppd.pth <- PPD pretrained weights | |
| # * checkpoints/depth_anything_v2_vitl.pth <- DA-V2 ViT-L semantics | |
| # * datasets extracted under /mnt/sig/datasets/ <- see datasets/README.md | |
| set -e | |
| # Stage 1: image pretrain (Hypersim only, 512×512) | |
| python main.py --cfg_file ppd/configs/lpd_pretrain.yaml pl_trainer.devices=1 | |
| # Stage 2 (uncomment after stage 1 produces a checkpoint): | |
| # python main.py --cfg_file ppd/configs/lpd_finetune.yaml pl_trainer.devices=8 | |
| # Stage 3 (uncomment for video): | |
| # python main.py --cfg_file ppd/configs/lpd_video.yaml pl_trainer.devices=8 | |