---
# Experiment configuration (dataset "dl3dv", 8 context views).
#
# NOTE(review): this file's block structure had been collapsed onto a few long
# lines. The layout below restores 2-space block indentation while keeping
# every key and value in its original order. Nesting was inferred from key
# order only; places where the parent mapping is ambiguous carry a
# NOTE(review) comment and should be confirmed against the consuming schema.

loss:
  mse:
    weight: 1.0
  lpips:
    weight: 0.5
    apply_after_step: 0
    perceptual_loss: true
  deltas:
    weight: 1
    exclude_by_norm_grad: true
    exclude_by_norm_grad_opposite: true
    eps: 1.0e-08
    apply_after_step: 100

dataset:
  view_sampler:
    name: boundedv2
    num_target_views: 6
    num_context_views: 8
    min_distance_between_context_views: 24
    max_distance_between_context_views: 45
    max_distance_to_context_views: 0
    context_gap_warm_up_steps: 10000
    target_gap_warm_up_steps: 0
    initial_min_distance_between_context_views: 20
    initial_max_distance_between_context_views: 30
    initial_max_distance_to_context_views: 0
    extra_views_sampling_strategy: farthest_point
    target_views_replace_sample: false
  name: dl3dv
  roots:
    - datasets/dl3dv-480p-chunks
  make_baseline_1: false
  augment: true
  image_shape:
    - 256
    - 448
  background_color:
    - 0.0
    - 0.0
    - 0.0
  cameras_are_circular: false
  baseline_epsilon: 0.001
  max_fov: 100.0
  skip_bad_shape: true
  near: 0.01
  far: 200.0
  baseline_scale_bounds: false
  shuffle_val: true
  test_len: -1
  test_chunk_interval: 1
  sort_target_index: true
  sort_context_index: true
  train_times_per_scene: 1
  test_times_per_scene: 1
  ori_image_shape:
    - 270
    - 480
  overfit_to_scene: null
  overfit_max_views: 148
  use_index_to_load_chunk: false
  mix_tartanair: false
  no_mix_test_set: true
  load_depth: false
  center_pose: false
  opencv_pose_format: true
  min_views: 0
  max_views: 0
  highres: false
  mix_re10k: false
  re10k_min_view_dist: 40
  re10k_max_view_dist: 300
  pose_align_first_view: false
  pose_align_middle_view: false
  scale_extrinsics: 1.0
  metric_scale_align_dl3dv: false
  load_remain_context: false
  num_remain_context: 8
  random_crop: false
  min_size:
    - 384
    - 512
  max_size:
    - 512
    - 960

scene_trainer:
  scene_initializer:
    per_pixel: true
    per_view: true
    name: resplat
    num_depth_candidates: 128
    num_surfaces: 1
    gaussians_per_pixel: 1
    # NOTE(review): the extent of this mapping is inferred; every key up to
    # `d_feature` is assumed to belong to gaussian_adapter - confirm.
    gaussian_adapter:
      # NOTE(review): gaussian_scale_min (0.5) is greater than
      # gaussian_scale_max (0.3). Values are kept as found; confirm whether
      # the bounds are swapped/mistyped or simply unused in this setup.
      gaussian_scale_min: 0.5
      gaussian_scale_max: 0.3
      sh_degree: 3
      exp_scale: false
      softplus_scale: true
      clamp_min_scale: 1.0e-06
      scale_detach_depth: false
      exp_scale_bias: 4.0
      no_rotate_sh: true
      no_sh_mask: true
      init_rotation_identity: false
    d_feature: 128
    visualizer:
      num_samples: 8
      min_resolution: 256
      export_ply: false
    unimatch_weights_path: pretrained/gmdepth-scale1-resumeflowthings-scannet-5d9d7964.pth
    multiview_trans_attn_split: 2
    costvolume_unet_feat_dim: 128
    costvolume_unet_channel_mult:
      - 1
      - 1
      - 1
    costvolume_unet_attn_res: []
    depth_unet_feat_dim: 64
    depth_unet_attn_res: []
    depth_unet_channel_mult:
      - 1
      - 1
      - 1
    downscale_factor: 4
    shim_patch_size: 4
    local_mv_match: 2
    monodepth_vit_type: vits
    supervise_intermediate_depth: true
    return_depth: true
    num_scales: 1
    upsample_factor: 8
    lowest_feature_resolution: 8
    depth_unet_channels: 128
    grid_sample_disable_cudnn: false
    large_gaussian_head: false
    color_large_unet: false
    init_sh_input_img: true
    feature_upsampler_channels: 64
    gaussian_regressor_channels: 256
    unet_gaussian_regressor: false
    resnet_gaussian_regressor: false
    train_depth_only: false
    pt_head: true
    pt_heads: 1
    init_pt_with_mv_attn: false
    init_pt_with_mv_attn_lowres: false
    pt_head_channels: null
    pt_head_concat_img: false
    pt_head_conv: false
    multi_scale_pt: false
    attn_proj_channels: 64
    fps_num_samples: null
    knn_samples: 16
    post_norm: false
    no_rpe: true
    no_knn_attn: false
    num_blocks: 4
    pt_downsample: 0
    fps_agg_func: attn
    subsample_method: fps
    add_pt_residual: true
    pt_pred_residual_position: false
    freeze_depth: false
    use_gt_depth: false
    separate_depth_color: false
    separate_depth_type: small
    separate_depth_gaussian_scale: false
    sample_log_depth: true
    bilinear_upsample_depth: false
    no_upsample_depth: false
    return_lowres_depth: false
    foundationstereo: false
    fstereo_num_refine: 1
    lvsm_gaussian_regressor: false
    lvsm_layers: 6
    latent_gs: true
    latent_downsample: 4
    fixed_latent_size: true
    latent_gs_img_interp: area
    dpt_head_depth: false
    latent_dpt_upsampler: false
    latent_dpt_upsampler_no_concat: false
    light_dpt_feature: false
    avgpool_depth: false
    nearest_down_depth: false
    predict_scale: false
    norm_by_points: false
    no_pred_depth_range: false
    point_dist_init_gaussian_scale: false
    resizeconv_upsampler: false
    depth_pred_half_res: false
    use_amp: true
    pt_head_amp: true
    use_fsdp: false
    use_checkpointing: false
    init_use_checkpointing: false
    new_gaussian_order: true
    rotate_quat_to_world: false
    refine_rotate_quat_to_world: false
    refine_no_use_covariance: false
    latent_new_reshape: false
    ptv3: false
    ptv3_grid_size: 0.1
    no_pixel_offset: false
    init_gaussian_multiple: 1
    deform_sample_depth: false
    deform_sample_depth_debug: false
  scene_optimizer:
    refiner:
      name: none
      do_densify: false
      do_prune: false
      do_opacity_reset: false
      cap_max: -1
      noise_lr: 0.0
      pause_refine_after_reset: 0
      refine_every: 999999999
      reset_every: 999999999
      refine_start_iter: 999999999
      refine_stop_iter: 999999999
      refine_scale2d_stop_iter: 0
      grow_grad2d: 0.0
      grow_scale3d: 0.0
      prune_scale3d: 0.0
      prune_scale2d: 0.0
      grow_scale2d: 0.0
      min_opacity: 0.0
      prune_zero_radii: false
      reduce_opacity: false
      reduce_factor: 0.0
      reduce_every: 0
    # NOTE(review): lr_scheduler is placed as a sibling of refiner and is
    # assumed to end at its `name` key - confirm.
    lr_scheduler:
      lr_data:
        _base: 1
        _means: 1
        _scales: 1
        _quats: 1
        _opacities: 1
        _sh0: 1
        _shN: 1
      apply_scheduler:
        _base: false
        _means: false
        _scales: false
        _quats: false
        _opacities: false
        _sh0: false
        _shN: false
      name: none
    no_refine_mean: false
    no_refine_scale: false
    no_refine_rotation: false
    no_refine_opacity: false
    no_refine_sh0: false
    no_refine_shN: false
    name: clogs
    no_render_error: false
    refine_sh_only: false
    num_basic_refine_blocks: 4
    num_refine_blocks: 1
    input_error_lpips_features: false
    input_error_pool_vgg_features: false
    input_error_use_all_vgg_features: false
    input_error_vit_feature: false
    input_error_resnet_feature: true
    # NOTE(review): "inpu_" looks like a typo for "input_"; the key is kept
    # as-is because the consuming code may expect this exact spelling.
    inpu_error_no_freeze_resnet_feature: false
    input_error_shallow_resnet_feature: false
    input_error_resnet_feature_layers: 18
    input_error_convnext_feature: false
    input_error_convnext_feature_size: small
    input_error_concat_feature: false
    input_error_concat_feature_cosine: false
    input_error_cosine_feature: false
    input_error_add_feature: false
    input_error_concat_rgb_feature_error: false
    concat_init_state: false
    replace_init_state: false
    state_channels: 256
    refine_block_rmsnorm: false
    refine_block_layernorm: false
    pt_qk_norm: false
    norm_pt_block: false
    refine_gaussian_multiple: 1
    refine_residual_init_state: false
    clamp_refine_max_scale: 3.0
    clamp_min_scale: 1.0e-06
    clamp_min_raw_opacities: -7
    clamp_max_raw_opacities: 7
    gaussian_head_multiple: 1
    update_head_concat_img: false
    update_head_layer_num: 2
    update_head_act: gelu
    update_head_final_act: identity
    update_head_scale_mag: false
    update_head_scalar_scale: true
    update_head_scalar_scale_act: relu
    update_head_hidden_dim_matches: output
    update_attn_proj_channels: 64
    update_no_knn_attn: false
    update_no_tran_block_norm: false
    update_tran_block_act: gelu
    multi_gaussian_scale_smaller: false
    init_gaussian_multiple: 1
    refine_condition_pt_feature: true
    input_error_no_abs: false
    reinit_gaussian_when_refine_multiple: false
    refine_same_num_points: false
    input_error_no_shuffle: false
    input_error_cache_resnet_feature: false
    input_error_view_pool_resnet_feature: false
    input_error_global_pool_resnet_feature: false
    init_state_wo_features: false
    init_state_type: constant
    init_state_scale: 0
    pt_heads: 1
    refine_with_mv_attn: false
    refine_with_mv_attn_lowres: false
    refine_no_mv_attn: false
    mv_attn_conv_with_norm: false
    refine_mv_shuffle_attn: false
    refine_mv_attn_with_pos_enc: false
    refine_shuffle_attn_no_norm: false
    refine_mv_unimatch_attn: false
    refine_knn_samples: 16
    refine_multi_scale_pt: false
    input_alpha: false
    input_depth: false
    input_depth_smooth_error: false
    input_error: false
    input_zero_gaussian: false
    input_zero_state: false
    input_zero_init_state: false
    input_error_cross_attn: false
    input_error_cross_attn_blocks: 1
    input_error_cross_attn_with_mlp: false
    input_error_radii_averaged: false
    input_error_additional_cross_attn: false
    input_error_num_intermediate_views: 8
    input_error_mv_attn: false
    input_error_mv_attn_blocks: 2
    input_error_mv_attn_lowres: false
    input_error_mv_attn_proj_channels: 0
    input_error_lowres_attn_down_factor: 4
    input_error_lowres_attn_pos_enc: false
    input_error_mv_attn_swin: false
    input_error_num_views: 0
    input_error_remain_context: false
    input_error_merge_remain_context: false
    input_error_warp_remain_context: false
    input_error_random_num_remain_context: false
    input_error_num_remain_context_test: 0
    input_error_warp_input_view: false
    window_local_refine: false
    window_global_refine: false
    window_local_global_refine: false
    update_window_size: 0
    local_gaussian_render: false
    input_error_half_res: false
    input_gradient: true
    input_gradient_log: false
    input_gradient_log_clip_deltas: 0.001
    input_gradient_scale: 1.0
    gradient_update_scale: 1.0
    input_gradient_with_ssim_loss: true
    input_gradient_same_loss: false
    scale_residual_grads: false
    train_min_refine: 1
    train_max_refine: 6
    local_global_update: false
    num_global_update: 0
    train_global_update_only: false
    random_update_with_size: false
    ptv3: false
    ptv3_grid_size: 0.1
    use_amp: true
    pt_head_amp: true
    pt_update_amp: true
    use_checkpointing: false
    recurrent_use_checkpointing: false
    debug_refine_update_module: true
    debug_refine_mlp: false
    debug_refine_mlp_layers: 0
    debug_refine_mlp_fixed_init: false
    input_gradient_normalize: true
    input_gradient_normalize_type: adam
    input_normalize_state: false
    input_normalize_gaussians: false
    predict_state_scale: true
    opt_scales_before_act: false
    scale_initial_opacities: 1.0
    sh_d: 16
    local_prune_zero_radii: false
    local_prune_low_weights: false
    local_prune_low_weights_thresh: -1
    update_only_nonzero_grad: true
    experimental_run: false
    experimental_update:
      _base: true
      _means: true
      _scales: true
      _quats: true
      _opacities: true
      _sh0: true
      _shN: true
    experimental_use_grads: false
    experimental_use_norm_grads:
      _base: false
      _means: false
      _scales: false
      _quats: false
      _opacities: false
      _sh0: false
      _shN: false
    experimental_lr:
      _base: 1
      _means: 0.00016
      _scales: 0.005
      _opacities: 0.05
      _quats: 0.001
      _sh0: 0.0025
      _shN: 0.000125
    sample_init_gaussians: 0
    use_time_encoding: false
    time_encoding_max_steps: 2000
  # NOTE(review): `decoder` is assumed to be a sibling of scene_initializer /
  # scene_optimizer holding only `name` and `use_covariances`; the keys after
  # it are assumed to sit directly under scene_trainer - confirm.
  decoder:
    name: gsplat
    use_covariances: false
  use_fsdp: false
  train_scene_init: false
  train_scene_opt: true
  num_update_steps: 4
  iter_batch_size: -1
  iter_batch_size_min: -1
  iter_batch_size_max: -1
  # NOTE(review): `initializer` is assumed to be nested under scene_trainer
  # rather than being a top-level key - confirm.
  initializer:
    num_depth_candidates: 128
    costvolume_unet_feat_dim: 128
    costvolume_unet_channel_mult:
      - 1
      - 1
      - 1
    costvolume_unet_attn_res:
      - 4
    gaussians_per_pixel: 1
    depth_unet_feat_dim: 32
    depth_unet_attn_res:
      - 16
    depth_unet_channel_mult:
      - 1
      - 1
      - 1
      - 1
      - 1
    shim_patch_size: 16

test:
  postprocessing:
    steps: 2000
    compute_metrics_every: 100
    lr_data:
      _base: 1
      _means: 1
      _scales: 1
      _opacities: 1
      _quats: 1
      _sh0: 1
      _shN: 1
    scheduler: null
    scheduler_warm_up_ratio: 0.01
    __target__: src.scene_trainer.postprocessing.NoPostProcessCfg
    name: none
  output_path: null
  compute_scores: true
  compute_scores_metrics: [psnr, ssim, lpips]
  eval_time_skip_steps: 0
  eval_initialization: true
  save_render_image: false
  save_gt_image: false
  save_render_depth: false
  save_gt_depth: false
  save_error_image: false
  save_error_depth: false
  save_video: false
  save_depth: false
  save_depth_npy: false
  save_depth_concat_img: false
  save_gaussian: false
  save_poses: false
  no_align_to_view: false
  save_point_cloud: false
  render_chunk_size: null
  # NOTE(review): "stablize" looks like a typo for "stabilize"; the key is
  # kept as-is because the consuming code may expect this exact spelling.
  stablize_camera: false
  stab_camera_kernel: 50
  eval_context_views: false
  inference_window_size: null
  profile_model: false
  save_colmap_train_test_views: false
  ori_colmap_data_path: null
  adam_optimizer_step: 0
  save_at_iters: null
  save_every_freq:
    - 1
    - 10
    - 100
    - 500
  save_every_steps:
    - 0
    - 10
    - 100
    - 1000
  skip_if_outputs_exist: false
  dec_chunk_size: 30

wandb:
  project: ablation-dl3dv-8views
  entity: placeholder
  name: dl3dv
  mode: online
  id: null
  notes: ''
  tags:
    - dl3dv
    - 270x480

mode: train

data_loader:
  train:
    num_workers: 10
    persistent_workers: true
    batch_size: 1
    seed: 1234
  test:
    num_workers: 4
    persistent_workers: false
    batch_size: 1
    seed: 2345
  val:
    num_workers: 1
    persistent_workers: true
    batch_size: 1
    seed: 3456

meta_optimizer:
  lr: 0.0001
  lr_monodepth: 0.0
  lr_depth: 0.0
  warm_up_steps: 2000
  weight_decay: 0.01
  warm_up_ratio: 0.01
  adamw_8bit: false

checkpointing:
  load: null
  every_n_train_steps: 1000
  save_top_k: 5
  pretrained_model: checkpoints/optgs/unified-dl3dv-8views/init/checkpoints/epoch_20-step_100000.ckpt
  pretrained_model_rel_dir: ${checkpoint_rel_dir:${checkpointing.pretrained_model}}
  pretrained_monodepth: null
  pretrained_mvdepth: null
  pretrained_depth: null
  pretrained_scale_predictor: null
  pretrained_depth_teacher: null
  no_strict_load: true
  resume: false
  no_resume_upsampler: false
  partial_load: false
  # This key was listed twice in a row with the same value. Duplicate mapping
  # keys are invalid YAML and are rejected by strict loaders, so only one
  # entry is kept; the effective value is unchanged.
  # NOTE(review): confirm the second entry was not meant to be another key.
  freeze_mono_vit: false
  resume_update_module: null

train:
  depth_mode: null
  extended_visualization: false
  print_log_every_n_steps: 100
  eval_model_every_n_val: 2
  eval_data_length: 999999
  eval_deterministic: false
  eval_time_skip_steps: 3
  eval_save_model: true
  l1_loss: true
  intermediate_loss_weight: 0.9
  no_viz_video: false
  eval_depth: false
  forward_depth_only: false
  train_ignore_large_loss: 0.0
  no_log_projections: true
  no_log_video: true
  depth_loss_weight: 0.0
  log_depth_loss: true
  depth_smooth_loss_weight: 0.0
  depth_smooth_loss_nonorm: false
  depth_smooth_loss_weight_nvs: 0.0
  monodepth_loss_weight: 0.0
  depth_teacher_loss_weight: 0.0
  viz_depth_teacher: false
  eval_render_depth: false
  render_depth_loss_weight: 0.0
  viz_render_depth: false
  use_gt_depth_range: false
  depth_range_from_disparity: false
  max_disparity: 128.0
  min_disparity: 4.0
  img_warp_loss_weight: 0.0
  warp_loss_start_step: 5000
  loss_on_input_views: true
  loss_on_target_views: true
  loss_on_input_views_num: 4
  train_window_size: null
  half_res_lpips_loss: false
  viz_depth_separate: false
  use_replay_buffer: true
  # NOTE(review): every key up to the top-level `seed` is assumed to belong
  # to replay_buffer_cfg - confirm.
  replay_buffer_cfg:
    capacity: 20
    sample_batch_size: 1
    sample_prob: 0.7
    insert_prob: 0.99
    return_prob: 0.99
    simulate_ahead: true
    simulate_ahead_min_steps: 1
    simulate_ahead_max_steps: 50
    simulate_ahead_grow: 10000
    max_t: null
    push_only_if_not_full: false

seed: 111123

meta_trainer:
  max_steps: 100000
  val_check_interval: 0.25
  gradient_clip_val: 0.5
  num_sanity_val_steps: 2
  eval_index: null
  limit_test_batches: 1.0
  limit_train_batches: 1.0
  num_nodes: 1

# NOTE(review): the `!!python/object/apply` tag is Python-specific and makes
# the loader call a constructor; safe loaders refuse it. Only load this file
# from trusted sources, or consider storing the path as a plain string.
output_dir: !!python/object/apply:src.misc.io.CustomPath
  - checkpoints
  - rebuttal
  - dl3dv-8views
  - submitted
use_plugins: false
log_slurm_id: true