| META_INTERNAL=False torchrun --nnodes=4 --nproc_per_node=8 train.py \ | |
| --train_dataset " \ | |
| 15000 @ MVDataset(split='all', ROOT='trajectories/scannet_0.3_0.7', aug_crop=16, mask_bg='rand', resolution=224, transform=ColorJitter, num_views=10, num_render_views=2, random_order = True, random_render_order = False, dps_name = 'dps_train.h5', random_nv_nr = [[10,2]]) + \ | |
| 15000 @ MVDataset(split='all', ROOT='trajectories/scannet_0.3_1.0', aug_crop=16, mask_bg='rand', resolution=224, transform=ColorJitter, num_views=10, num_render_views=2, random_order = True, random_render_order = False, dps_name = 'dps_train.h5', random_nv_nr = [[10,2]]) + \ | |
| 15000 @ MVDataset(split='all', ROOT='trajectories/scannetpp_0.3_0.7', aug_crop=16, mask_bg='rand', resolution=224, transform=ColorJitter, num_views=10, num_render_views=2, random_order = True, random_render_order = False, dps_name = 'dps_train.h5', random_nv_nr = [[10,2]]) + \ | |
| 15000 @ MVDataset(split='all', ROOT='trajectories/scannetpp_0.3_1.0', aug_crop=16, mask_bg='rand', resolution=224, transform=ColorJitter, num_views=10, num_render_views=2, random_order = True, random_render_order = False, dps_name = 'dps_train.h5', random_nv_nr = [[10,2]]) + \ | |
| 30000 @ MVDataset(split='all', ROOT='trajectories/habitatSim_star_step_2.0', aug_crop=16, mask_bg='rand', resolution=224, transform=ColorJitter, num_views=10, num_render_views=2, random_order = True, random_render_order = False, render_start = 8, dps_name = 'dps_train.h5', random_nv_nr = [[10,2]]) + \ | |
| 30000 @ MVDataset(split='all', ROOT='trajectories/habitatSim_tree_step_1.0', aug_crop=16, mask_bg='rand', resolution=224, transform=ColorJitter, num_views=10, num_render_views=2, random_order = True, random_render_order = False, render_start = 8, dps_name = 'dps_train.h5', random_nv_nr = [[10,2]]) + \ | |
| 30000 @ MVDataset(split='all', ROOT='trajectories/habitatSim_tree_step_2.0', aug_crop=16, mask_bg='rand', resolution=224, transform=ColorJitter, num_views=10, num_render_views=2, random_order = True, random_render_order = False, render_start = 8, dps_name = 'dps_train.h5', random_nv_nr = [[10,2]])" \ | |
| --test_dataset " \ | |
| MVDataset(n_all=1000, split='all', ROOT='trajectories/habitatSim_test', resolution=224, seed=777, fix_order=True, num_views=30, num_render_views=6, render_start = 24, dps_name = 'dps_test.h5', tb_name = 'hs_tdf_2_testFull_30_6', n_ref = 4) + \ | |
| MVDataset(n_all=1000, split='all', ROOT='trajectories/habitatSim_test', resolution=224, seed=777, fix_order=True, num_views=5, num_render_views=1, render_start = 24, dps_name = 'dps_test.h5', tb_name = 'hs_tdf_2_testFull_5_1', n_ref = 4) + \ | |
| MVDataset(n_all=1000, split='all', ROOT='trajectories/habitatSim_test', resolution=224, seed=777, fix_order=True, num_views=10, num_render_views=2, render_start = 24, dps_name = 'dps_test.h5', tb_name = 'hs_tdf_2_testFull_10_2', n_ref = 4) + \ | |
| MVDataset(n_all=1000, split='all', ROOT='trajectories/scannet_test', resolution=224, seed=777, fix_order=True, num_views=30, num_render_views=6, render_start = 24, dps_name = 'dps_test.h5', tb_name = 'sc_1_30_6', n_ref = 4) + \ | |
| MVDataset(n_all=1000, split='all', ROOT='trajectories/scannet_test', resolution=224, seed=777, fix_order=True, num_views=5, num_render_views=1, render_start = 24, dps_name = 'dps_test.h5', tb_name = 'sc_1_5_1', n_ref = 4) + \ | |
| MVDataset(n_all=1000, split='all', ROOT='trajectories/scannet_test', resolution=224, seed=777, fix_order=True, num_views=10, num_render_views=2, render_start = 24, dps_name = 'dps_test.h5', tb_name = 'sc_1_10_2', n_ref = 4) + \ | |
| MVDataset(n_all=1000, split='all', ROOT='trajectories/mp3d_test', resolution=224, seed=777, fix_order=True, num_views=30, num_render_views=6, render_start = 24, dps_name = 'dps_test.h5', tb_name = 'mp3d_tdf_2_testFull_30_6', n_ref = 4) + \ | |
| MVDataset(n_all=1000, split='all', ROOT='trajectories/mp3d_test', resolution=224, seed=777, fix_order=True, num_views=5, num_render_views=1, render_start = 24, dps_name = 'dps_test.h5', tb_name = 'mp3d_tdf_2_testFull_5_1', n_ref = 4) + \ | |
| MVDataset(n_all=1000, split='all', ROOT='trajectories/mp3d_test', resolution=224, seed=777, fix_order=True, num_views=10, num_render_views=2, render_start = 24, dps_name = 'dps_test.h5', tb_name = 'mp3d_tdf_2_testFull_10_2', n_ref = 4)" \ | |
| --model "AsymmetricCroCo3DStereoMultiView(pos_embed='RoPE100', img_size=(224, 224), head_type='linear', output_mode='pts3d', depth_mode=('exp', -inf, inf), conf_mode=('exp', 1, 1e9), enc_embed_dim=1024, enc_depth=24, enc_num_heads=16, dec_embed_dim=768, dec_depth=12, dec_num_heads=12, GS = True, sh_degree=0, pts_head_config = {'skip':True})" \ | |
| --train_criterion "GSRenderLoss(L21, norm_mode='avg_dis', mv = True, scale_scaled = True, use_gt_pcd = False, lpips_coeff = 1.0, rgb_coeff = 1.0, use_img_rgb = True, local_loss_coeff=0.0) + ConfLoss(Regr3D(L21, norm_mode='avg_dis', mv = True), alpha=0.2)" \ | |
| --test_criterion "GSRenderLoss(L21, norm_mode='avg_dis', mv = True, render_included = True, scale_scaled = True, use_img_rgb = True, local_loss_coeff=0.0) + Regr3D_ScaleShiftAllInv(L21, gt_scale=True, mv = True)" \ | |
| --pretrained "checkpoints/DUSt3R_ViTLarge_BaseDecoder_224_linear.pth" \ | |
| --lr 0.00015 --min_lr 0.000001 --warmup_epochs 1 --epochs 100 --batch_size 8 --accum_iter 2 --save_freq 1 --keep_freq 5 --eval_freq 5 --num_workers 16 \ | |
| --output_dir outputs/MVD | |