| loss: |
| stability: |
| weight: 1.0 |
| lpips: |
| apply_after_step: 0 |
| weight: 0.5 |
| perceptual_loss: true |
| mse: |
| weight: 1.0 |
| deltas: |
| weight: 1 |
| exclude_by_norm_grad: true |
| exclude_by_norm_grad_opposite: true |
| eps: 1.0e-08 |
| apply_after_step: 100 |
| dataset: |
| image_shape: |
| - 256 |
| - 448 |
| background_color: |
| - 0.0 |
| - 0.0 |
| - 0.0 |
| cameras_are_circular: false |
| overfit_to_scene: null |
| opencv_pose_format: false |
| pose_align_middle_view: false |
| test_start_idx: 0 |
| view_sampler: |
| name: boundedv2 |
| num_target_views: 6 |
| num_context_views: 64 |
| min_distance_between_context_views: -1 |
| max_distance_between_context_views: -1 |
| max_distance_to_context_views: 0 |
| context_gap_warm_up_steps: 10000 |
| target_gap_warm_up_steps: 0 |
| initial_min_distance_between_context_views: -1 |
| initial_max_distance_between_context_views: -1 |
| initial_max_distance_to_context_views: 0 |
| extra_views_sampling_strategy: farthest_point |
| target_views_replace_sample: false |
| name: dl3dv |
| roots: |
| - datasets/dl3dv-480p-chunks |
| make_baseline_1: false |
| augment: true |
| baseline_epsilon: 0.001 |
| max_fov: 100.0 |
| skip_bad_shape: true |
| near: 0.01 |
| far: 200.0 |
| baseline_scale_bounds: false |
| shuffle_val: true |
| test_len: -1 |
| test_chunk_interval: 1 |
| sort_target_index: true |
| sort_context_index: true |
| train_times_per_scene: 1 |
| test_times_per_scene: 1 |
| ori_image_shape: |
| - 270 |
| - 480 |
| overfit_max_views: 148 |
| use_index_to_load_chunk: false |
| mix_tartanair: false |
| no_mix_test_set: true |
| load_depth: false |
| center_pose: false |
| pose_align_first_view: false |
| scale_extrinsics: 1.0 |
| metric_scale_align_dl3dv: false |
| min_views: 0 |
| max_views: 0 |
| highres: false |
| mix_re10k: false |
| re10k_min_view_dist: 40 |
| re10k_max_view_dist: 300 |
| load_remain_context: false |
| num_remain_context: 8 |
| random_crop: false |
| min_size: |
| - 384 |
| - 512 |
| max_size: |
| - 512 |
| - 960 |
| index_name: index_colmap.json |
| scene_trainer: |
| scene_initializer: |
| per_pixel: false |
| per_view: false |
| train_min_gaussians_subsample: 0.1 |
| train_max_gaussians_subsample: 1.0 |
| eval_min_gaussians_subsample: null |
| eval_max_gaussians_subsample: null |
| train_fixed_gaussians_num: 70000 |
| eval_fixed_gaussians_num: 70000 |
| name: colmap |
| path: datasets/dl3dv-colmap-sfm |
| normalize_world_space: false |
| scaling_factor: 1.0 |
| init_opacity: 0.1 |
| sh_degree: 3 |
| dl3dv_settings: true |
| filter_zero_rgb: true |
| points3d_subdir: null |
| points3d_ply_filename: null |
| randomize_opacity: false |
| randomize_opacity_distribution: uniform |
| randomize_opacity_min: 0.0 |
| randomize_opacity_std: 0.05 |
| override_dataset_poses: true |
| scene_optimizer: |
| refiner: |
| name: none |
| do_densify: false |
| do_prune: false |
| do_opacity_reset: false |
| cap_max: -1 |
| noise_lr: 0.0 |
| pause_refine_after_reset: 0 |
| refine_every: 999999999 |
| reset_every: 999999999 |
| refine_start_iter: 999999999 |
| refine_stop_iter: 999999999 |
| refine_scale2d_stop_iter: 0 |
| grow_grad2d: 0.0 |
| grow_scale3d: 0.0 |
| prune_scale3d: 0.0 |
| prune_scale2d: 0.0 |
| grow_scale2d: 0.0 |
| min_opacity: 0.0 |
| prune_zero_radii: false |
| reduce_opacity: false |
| reduce_factor: 0.0 |
| reduce_every: 0 |
| lr_scheduler: |
| lr_data: |
| _base: 1 |
| _means: 1 |
| _scales: 1 |
| _quats: 1 |
| _opacities: 1 |
| _sh0: 1 |
| _shN: 1 |
| apply_scheduler: |
| _base: false |
| _means: false |
| _scales: false |
| _quats: false |
| _opacities: false |
| _sh0: false |
| _shN: false |
| name: none |
| input_gradients_chunk_size: -1 |
| no_refine_mean: false |
| no_refine_scale: false |
| no_refine_rotation: false |
| no_refine_opacity: false |
| no_refine_sh0: false |
| no_refine_shN: false |
| name: clogs |
| no_render_error: false |
| refine_sh_only: false |
| num_basic_refine_blocks: 4 |
| num_refine_blocks: 1 |
| concat_init_state: false |
| replace_init_state: false |
| state_channels: 256 |
| refine_block_rmsnorm: false |
| refine_block_layernorm: false |
| pt_qk_norm: false |
| norm_pt_block: false |
| refine_gaussian_multiple: 1 |
| refine_residual_init_state: false |
| clamp_refine_max_scale: 3.0 |
| clamp_min_scale: 1.0e-06 |
| clamp_min_raw_scales: -8.0 |
| clamp_max_raw_scales: 2.3 |
| clamp_min_raw_opacities: -7 |
| clamp_max_raw_opacities: 7 |
| gaussian_head_multiple: 1 |
| clamp_min_sh0: -10000000000.0 |
| clamp_max_sh0: 10000000000.0 |
| clamp_min_shs: -2.0 |
| clamp_max_shs: 2.0 |
| clamp_shs_soft: false |
| update_attn_proj_channels: 64 |
| update_no_knn_attn: false |
| update_no_tran_block_norm: false |
| update_tran_block_act: gelu |
| multi_gaussian_scale_smaller: false |
| init_gaussian_multiple: 1 |
| refine_condition_pt_feature: true |
| input_error_no_abs: false |
| reinit_gaussian_when_refine_multiple: false |
| refine_same_num_points: false |
| input_error_rgb_no_shuffle: false |
| input_error_cache_resnet_feature: false |
| input_error_view_pool_resnet_feature: false |
| input_error_global_pool_resnet_feature: false |
| init_state_wo_features: true |
| init_state_type: random |
| init_state_scale: 1.0 |
| pt_heads: 1 |
| refine_with_mv_attn: false |
| refine_with_mv_attn_lowres: false |
| refine_no_mv_attn: false |
| mv_attn_conv_with_norm: false |
| refine_mv_shuffle_attn: false |
| refine_mv_attn_with_pos_enc: false |
| refine_shuffle_attn_no_norm: false |
| refine_mv_unimatch_attn: false |
| refine_knn_samples: 4 |
| refine_multi_scale_pt: false |
| use_fused_attn: true |
| prune_invisible_gaussians: false |
| knn_idx_update_every: 1 |
| input_alpha: false |
| input_depth: false |
| input_depth_smooth_error: false |
| input_error: false |
| input_error_add_rgb_feature: false |
| input_error_lpips_feature: false |
| input_error_pool_vgg_features: false |
| input_error_use_all_vgg_features: false |
| input_error_vit_feature: false |
| input_error_resnet_feature: true |
| input_error_no_freeze_resnet_feature: false |
| input_error_shallow_resnet_feature: false |
| input_error_resnet_feature_layers: 18 |
| input_error_convnext_feature: false |
| input_error_convnext_feature_size: small |
| input_error_concat_feature: false |
| input_error_concat_feature_cosine: false |
| input_error_cosine_feature: false |
| input_error_add_feature: false |
| input_error_concat_rgb_feature: false |
| input_error_cross_attn: false |
| input_error_cross_attn_blocks: 1 |
| input_error_cross_attn_with_mlp: false |
| input_error_radii_averaged: false |
| input_error_additional_cross_attn: false |
| input_error_num_intermediate_views: 8 |
| input_error_mv_attn: false |
| input_error_mv_attn_blocks: 2 |
| input_error_mv_attn_lowres: false |
| input_error_mv_attn_proj_channels: 0 |
| input_error_lowres_attn_down_factor: 4 |
| input_error_lowres_attn_pos_enc: false |
| input_error_mv_attn_swin: false |
| input_error_num_views: 0 |
| input_error_remain_context: false |
| input_error_merge_remain_context: false |
| input_error_warp_remain_context: false |
| input_error_random_num_remain_context: false |
| input_error_num_remain_context_test: 0 |
| input_error_warp_input_view: false |
| input_zero_gaussian: false |
| input_zero_state: false |
| input_zero_init_state: false |
| input_gradient: true |
| input_gradient_log: false |
| input_gradient_log_clip_deltas: 0.001 |
| input_gradient_scale: 1.0 |
| gradient_update_scale: 1.0 |
| input_gradient_with_ssim_loss: true |
| input_gradient_same_loss: false |
| input_gradient_loss_reduction: mean_pixels_sum_views |
| scale_residual_grads: false |
| window_local_refine: false |
| window_global_refine: false |
| window_local_global_refine: false |
| update_window_size: 0 |
| local_gaussian_render: false |
| input_error_half_res: false |
| local_global_update: false |
| num_global_update: 0 |
| train_global_update_only: false |
| random_update_with_size: false |
| ptv3: false |
| ptv3_grid_size: 0.1 |
| use_amp: true |
| pt_head_amp: true |
| pt_update_amp: true |
| use_checkpointing: false |
| recurrent_use_checkpointing: false |
| debug_refine_update_module: true |
| debug_refine_mlp: false |
| debug_refine_mlp_layers: 0 |
| debug_refine_mlp_fixed_init: false |
| input_gradient_normalize: true |
| input_gradient_normalize_type: adam |
| input_normalize_state: false |
| input_normalize_gaussians: false |
| residual_state: false |
| predict_state_scale: true |
| predict_state_scale_norm: false |
| update_head_concat_img: false |
| update_head_layer_num: 2 |
| update_head_act: gelu |
| update_head_final_act: identity |
| update_head_hidden_dim_matches: input |
| update_head_scale_mag: false |
| update_head_scalar_scale: true |
| update_head_scalar_scale_act: relu |
| update_head_per_param_heads: false |
| update_head_per_param_hidden_dim: 48 |
| update_head_per_param_scales: false |
| opt_scales_before_act: true |
| scale_initial_opacities: 1.0 |
| sh_d: 16 |
| local_prune_zero_radii: false |
| local_prune_low_weights: false |
| local_prune_low_weights_thresh: -1 |
| update_only_nonzero_grad: true |
| experimental_run: false |
| experimental_update: |
| _base: true |
| _means: true |
| _scales: true |
| _quats: true |
| _opacities: true |
| _sh0: true |
| _shN: true |
| experimental_use_grads: false |
| experimental_use_norm_grads: |
| _base: false |
| _means: false |
| _scales: false |
| _quats: false |
| _opacities: false |
| _sh0: false |
| _shN: false |
| experimental_lr: |
| _base: 1 |
| _means: 0.00016 |
| _scales: 0.005 |
| _opacities: 0.05 |
| _quats: 0.001 |
| _sh0: 0.0025 |
| _shN: 0.000125 |
| sample_init_gaussians: 0 |
| use_time_encoding: false |
| time_encoding_max_steps: 2000 |
| decoder: |
| name: gsplat |
| use_covariances: false |
| rasterize_mode: classic |
| eps2d: 0.0001 |
| use_fsdp: false |
| train_scene_init: false |
| train_scene_opt: true |
| train_min_refine: 1 |
| train_max_refine: 6 |
| num_update_steps: 2000 |
| iter_batch_size: -1 |
| opt_batch_size: 8 |
| opt_batch_size_min: 0 |
| opt_batch_size_max: 0 |
| opt_batch_strategy: random |
| sh_degree_interval: 0 |
| test: |
| postprocessing: |
| steps: 0 |
| compute_metrics_every: 100 |
| lr_data: |
| _base: 1 |
| _means: 1 |
| _scales: 1 |
| _opacities: 1 |
| _quats: 1 |
| _sh0: 1 |
| _shN: 1 |
| scheduler: null |
| scheduler_warm_up_ratio: 0.01 |
| prior_steps: 0 |
| means_lr_final_ratio: 0.0625 |
| means_lr_delay_mult: 0.01 |
| means_lr_scale_by_scene_extent: true |
| chunk_size: -1 |
| adc: null |
| name: none |
| output_path: null |
| compute_scores: true |
| compute_scores_metrics: |
| - psnr |
| - ssim |
| - lpips |
| metrics_batch_size: 32 |
| eval_time_skip_steps: 0 |
| eval_initialization: true |
| save_render_image: false |
| save_render_image_last_only: false |
| save_gt_image: false |
| save_render_depth: false |
| save_gt_depth: false |
| save_error_image: false |
| save_error_depth: false |
| save_video: false |
| save_video_fixed_view: false |
| save_video_fixed_view_index: 0 |
| save_video_fixed_view_duplicate: 0 |
| save_video_fixed_iteration: false |
| save_video_fixed_iteration_indices: null |
| save_video_fixed_iteration_render_fixed_view: false |
| save_video_combined: false |
| save_video_combined_iterations: null |
| save_video_combined_fixed_iteration_length: 50 |
| save_depth: false |
| save_depth_npy: false |
| save_depth_concat_img: false |
| save_gaussian: false |
| save_poses: false |
| save_cameras_json: true |
| no_align_to_view: false |
| save_point_cloud: false |
| render_chunk_size: null |
| dec_chunk_size: 30 |
| stablize_camera: false |
| stab_camera_kernel: 50 |
| eval_context_views: false |
| inference_window_size: null |
| profile_model: false |
| save_colmap_train_test_views: false |
| ori_colmap_data_path: null |
| adam_optimizer_step: 0 |
| save_at_iters: |
| - 0 |
| - 1 |
| - 5 |
| - 10 |
| - 50 |
| - 100 |
| - 200 |
| - 300 |
| - 400 |
| - 500 |
| - 1000 |
| save_every_freq: |
| - 1 |
| - 10 |
| - 100 |
| - 500 |
| save_every_steps: |
| - 0 |
| - 10 |
| - 100 |
| - 1000 |
| skip_if_outputs_exist: false |
| scenes_filter: null |
| experimental_add_noise_to_images: false |
| experimental_add_noise_to_images_std: null |
| train: |
| replay_buffer_cfg: |
| capacity: 20 |
| sample_batch_size: 1 |
| sample_prob: 0.7 |
| insert_prob: 0.7 |
| return_prob: 0.99 |
| simulate_ahead: true |
| simulate_ahead_min_steps: 1 |
| simulate_ahead_max_steps: 50 |
| simulate_ahead_grow: 10000 |
| max_t: null |
| push_only_if_not_full: false |
| remove_strategy_when_full: oldest |
| depth_mode: null |
| extended_visualization: false |
| print_log_every_n_steps: 100 |
| eval_model_every_n_val: 2 |
| eval_data_length: 5 |
| eval_deterministic: false |
| eval_time_skip_steps: 3 |
| eval_save_model: true |
| l1_loss: true |
| intermediate_loss_weight: 0.9 |
| no_viz_video: false |
| eval_depth: false |
| forward_depth_only: false |
| train_ignore_large_loss: 0.0 |
| no_log_projections: true |
| no_log_video: true |
| depth_loss_weight: 0.0 |
| log_depth_loss: true |
| depth_smooth_loss_weight: 0.0 |
| depth_smooth_loss_nonorm: false |
| depth_smooth_loss_weight_nvs: 0.0 |
| monodepth_loss_weight: 0.0 |
| depth_teacher_loss_weight: 0.0 |
| viz_depth_teacher: false |
| eval_render_depth: false |
| render_depth_loss_weight: 0.0 |
| viz_render_depth: false |
| use_gt_depth_range: false |
| depth_range_from_disparity: false |
| max_disparity: 128.0 |
| min_disparity: 4.0 |
| img_warp_loss_weight: 0.0 |
| warp_loss_start_step: 5000 |
| loss_on_input_views: true |
| loss_on_target_views: true |
| loss_on_input_views_num: 4 |
| loss_on_target_views_num: 6 |
| train_window_size: null |
| half_res_lpips_loss: false |
| viz_depth_separate: false |
| scale_l2_loss_weight: 0.0 |
| sh_l2_loss_weight: 0.0 |
| opacity_l2_loss_weight: 0.0 |
| use_replay_buffer: true |
| wandb: |
| project: eccv |
| entity: placeholder |
| name: dl3dv |
| mode: online |
| id: null |
| notes: '' |
| tags: |
| - dl3dv |
| - 270x480 |
| mode: train |
| data_loader: |
| train: |
| num_workers: 10 |
| persistent_workers: true |
| batch_size: 1 |
| seed: 1234 |
| test: |
| num_workers: 4 |
| persistent_workers: false |
| batch_size: 1 |
| seed: 2345 |
| val: |
| num_workers: 1 |
| persistent_workers: true |
| batch_size: 1 |
| seed: 3456 |
| meta_optimizer: |
| lr: 0.0001 |
| lr_monodepth: 0.0 |
| lr_depth: 0.0 |
| warm_up_steps: 2000 |
| weight_decay: 0.01 |
| warm_up_ratio: 0.01 |
| adamw_8bit: false |
| checkpointing: |
| load: null |
| every_n_train_steps: 1000 |
| save_top_k: 5 |
| pretrained_model: null |
| pretrained_model_rel_dir: ${checkpoint_rel_dir:${checkpointing.pretrained_model}} |
| pretrained_monodepth: null |
| pretrained_mvdepth: null |
| pretrained_depth: null |
| pretrained_scale_predictor: null |
| pretrained_depth_teacher: null |
| no_strict_load: false |
| resume: false |
| no_resume_upsampler: false |
| partial_load: false |
| freeze_mono_vit: false |
| resume_update_module: null |
| pretrained_initializer: null |
| pretrained_optimizer: null |
| load_existing_cfg: false |
| seed: 111123 |
| meta_trainer: |
| max_steps: 50000 |
| val_check_interval: 0.25 |
| gradient_clip_val: 0.5 |
| num_sanity_val_steps: 1 |
| eval_index: null |
| limit_test_batches: 1.0 |
| limit_train_batches: 1.0 |
| num_nodes: 1 |
| output_dir: !!python/object/apply:src.misc.io.CustomPath |
| - checkpoints |
| - post_eccv |
| - sfm_init |
| - dl3dv_dense |
| - dense_knn_4_stability_or_rerun |
| use_plugins: false |
| log_slurm_id: true |
| version: 1 |
| profiling: |
| mode: none |
| debug_cfg: false |
|
|