# learn2splat/sparse/config.yaml
# Uploader: SteEsp
# Commit message: Upload folder using huggingface_hub
# Commit: 44cf072 (verified)
# Loss configuration: three named terms (mse, lpips, deltas), each followed by
# a `weight`.
# NOTE(review): indentation is missing in this copy, so which keys belong to
# which term is inferred from key order only — confirm against the original.
loss:
mse:
weight: 1.0
lpips:
weight: 0.5
# Presumably the training step after which this term becomes active — confirm.
apply_after_step: 0
perceptual_loss: true
deltas:
weight: 1
exclude_by_norm_grad: true
exclude_by_norm_grad_opposite: true
eps: 1.0e-08
# Second `apply_after_step`; set to 100 here versus 0 for the one above.
apply_after_step: 100
# Dataset configuration: a view sampler (`name: boundedv2`) followed by the
# dataset settings (`name: dl3dv`).
# NOTE(review): indentation is missing in this copy; the boundary between the
# `view_sampler` keys and the dataset-level keys is presumably the second
# `name` key — confirm against the original file.
dataset:
view_sampler:
name: boundedv2
num_target_views: 6
num_context_views: 8
min_distance_between_context_views: 24
max_distance_between_context_views: 45
max_distance_to_context_views: 0
context_gap_warm_up_steps: 10000
target_gap_warm_up_steps: 0
# `initial_*` values mirror the three distance keys above with smaller bounds
# (20/30 versus 24/45).
initial_min_distance_between_context_views: 20
initial_max_distance_between_context_views: 30
initial_max_distance_to_context_views: 0
extra_views_sampling_strategy: farthest_point
target_views_replace_sample: false
name: dl3dv
# List of dataset root directories; a single relative path here.
roots:
- datasets/dl3dv-480p-chunks
make_baseline_1: false
augment: true
# Two-element list; presumably [height, width] — TODO confirm.
image_shape:
- 256
- 448
# Three float components, all 0.0.
background_color:
- 0.0
- 0.0
- 0.0
cameras_are_circular: false
baseline_epsilon: 0.001
max_fov: 100.0
skip_bad_shape: true
near: 0.01
far: 200.0
baseline_scale_bounds: false
shuffle_val: true
test_len: -1
test_chunk_interval: 1
sort_target_index: true
sort_context_index: true
train_times_per_scene: 1
test_times_per_scene: 1
# Two-element list; differs from `image_shape` above (270x480 versus 256x448).
ori_image_shape:
- 270
- 480
overfit_to_scene: null
overfit_max_views: 148
use_index_to_load_chunk: false
mix_tartanair: false
no_mix_test_set: true
load_depth: false
center_pose: false
opencv_pose_format: true
min_views: 0
max_views: 0
highres: false
mix_re10k: false
re10k_min_view_dist: 40
re10k_max_view_dist: 300
pose_align_first_view: false
pose_align_middle_view: false
scale_extrinsics: 1.0
metric_scale_align_dl3dv: false
load_remain_context: false
num_remain_context: 8
random_crop: false
# Two-element size bounds; only relevant if the consumer uses them while
# `random_crop` is false — not visible from here.
min_size:
- 384
- 512
max_size:
- 512
- 960
# Scene trainer configuration. This span opens `scene_trainer` and lists the
# settings of its `scene_initializer` (`name: resplat`).
# NOTE(review): indentation is missing in this copy; which of the keys below
# belong to the nested `gaussian_adapter` and `visualizer` maps cannot be
# determined from here — confirm against the original file.
scene_trainer:
scene_initializer:
per_pixel: true
per_view: true
name: resplat
num_depth_candidates: 128
num_surfaces: 1
gaussians_per_pixel: 1
gaussian_adapter:
# NOTE(review): gaussian_scale_min (0.5) is larger than gaussian_scale_max
# (0.3). If these are used as clamp bounds the range is empty — confirm the
# intended values with the consumer.
gaussian_scale_min: 0.5
gaussian_scale_max: 0.3
sh_degree: 3
exp_scale: false
softplus_scale: true
clamp_min_scale: 1.0e-06
scale_detach_depth: false
exp_scale_bias: 4.0
no_rotate_sh: true
no_sh_mask: true
init_rotation_identity: false
d_feature: 128
visualizer:
num_samples: 8
min_resolution: 256
export_ply: false
# Relative path to a pretrained weights file.
unimatch_weights_path: pretrained/gmdepth-scale1-resumeflowthings-scannet-5d9d7964.pth
multiview_trans_attn_split: 2
costvolume_unet_feat_dim: 128
costvolume_unet_channel_mult:
- 1
- 1
- 1
# Explicit empty list.
costvolume_unet_attn_res: []
depth_unet_feat_dim: 64
# Explicit empty list.
depth_unet_attn_res: []
depth_unet_channel_mult:
- 1
- 1
- 1
downscale_factor: 4
shim_patch_size: 4
local_mv_match: 2
monodepth_vit_type: vits
supervise_intermediate_depth: true
return_depth: true
num_scales: 1
upsample_factor: 8
lowest_feature_resolution: 8
depth_unet_channels: 128
grid_sample_disable_cudnn: false
large_gaussian_head: false
color_large_unet: false
init_sh_input_img: true
feature_upsampler_channels: 64
gaussian_regressor_channels: 256
unet_gaussian_regressor: false
resnet_gaussian_regressor: false
train_depth_only: false
pt_head: true
pt_heads: 1
init_pt_with_mv_attn: false
init_pt_with_mv_attn_lowres: false
pt_head_channels: null
pt_head_concat_img: false
pt_head_conv: false
multi_scale_pt: false
attn_proj_channels: 64
fps_num_samples: null
knn_samples: 16
post_norm: false
no_rpe: true
no_knn_attn: false
num_blocks: 4
pt_downsample: 0
fps_agg_func: attn
subsample_method: fps
add_pt_residual: true
pt_pred_residual_position: false
freeze_depth: false
use_gt_depth: false
separate_depth_color: false
separate_depth_type: small
separate_depth_gaussian_scale: false
sample_log_depth: true
bilinear_upsample_depth: false
no_upsample_depth: false
return_lowres_depth: false
foundationstereo: false
fstereo_num_refine: 1
lvsm_gaussian_regressor: false
lvsm_layers: 6
latent_gs: true
latent_downsample: 4
fixed_latent_size: true
latent_gs_img_interp: area
dpt_head_depth: false
latent_dpt_upsampler: false
latent_dpt_upsampler_no_concat: false
light_dpt_feature: false
avgpool_depth: false
nearest_down_depth: false
predict_scale: false
norm_by_points: false
no_pred_depth_range: false
point_dist_init_gaussian_scale: false
resizeconv_upsampler: false
depth_pred_half_res: false
use_amp: true
pt_head_amp: true
use_fsdp: false
use_checkpointing: false
init_use_checkpointing: false
new_gaussian_order: true
rotate_quat_to_world: false
refine_rotate_quat_to_world: false
refine_no_use_covariance: false
latent_new_reshape: false
ptv3: false
ptv3_grid_size: 0.1
no_pixel_offset: false
init_gaussian_multiple: 1
deform_sample_depth: false
deform_sample_depth_debug: false
# Scene optimizer configuration. Contains a `refiner` map and an
# `lr_scheduler` map (both with `name: none`), followed by the optimizer's own
# settings (`name: clogs`).
# NOTE(review): indentation is missing in this copy, so the exact extent of
# each nested map is inferred from key order — confirm against the original.
scene_optimizer:
refiner:
name: none
do_densify: false
do_prune: false
do_opacity_reset: false
cap_max: -1
noise_lr: 0.0
pause_refine_after_reset: 0
# The interval/start/stop keys below all use the same large sentinel value
# (999999999); presumably this keeps refinement from ever triggering — confirm.
refine_every: 999999999
reset_every: 999999999
refine_start_iter: 999999999
refine_stop_iter: 999999999
refine_scale2d_stop_iter: 0
grow_grad2d: 0.0
grow_scale3d: 0.0
prune_scale3d: 0.0
prune_scale2d: 0.0
grow_scale2d: 0.0
min_opacity: 0.0
prune_zero_radii: false
reduce_opacity: false
reduce_factor: 0.0
reduce_every: 0
lr_scheduler:
# Per-group values keyed by _base/_means/_scales/_quats/_opacities/_sh0/_shN;
# every group is 1 here.
lr_data:
_base: 1
_means: 1
_scales: 1
_quats: 1
_opacities: 1
_sh0: 1
_shN: 1
# Per-group switches using the same seven group keys; all false here.
apply_scheduler:
_base: false
_means: false
_scales: false
_quats: false
_opacities: false
_sh0: false
_shN: false
name: none
no_refine_mean: false
no_refine_scale: false
no_refine_rotation: false
no_refine_opacity: false
no_refine_sh0: false
no_refine_shN: false
name: clogs
no_render_error: false
refine_sh_only: false
num_basic_refine_blocks: 4
num_refine_blocks: 1
input_error_lpips_features: false
input_error_pool_vgg_features: false
input_error_use_all_vgg_features: false
input_error_vit_feature: false
input_error_resnet_feature: true
# NOTE(review): this key is spelled `inpu_error_...` (missing "t"), unlike the
# sibling `input_error_*` keys. It is a key the consumer reads, so any rename
# must be coordinated with the consumer's schema.
inpu_error_no_freeze_resnet_feature: false
input_error_shallow_resnet_feature: false
input_error_resnet_feature_layers: 18
input_error_convnext_feature: false
input_error_convnext_feature_size: small
input_error_concat_feature: false
input_error_concat_feature_cosine: false
input_error_cosine_feature: false
input_error_add_feature: false
input_error_concat_rgb_feature_error: false
concat_init_state: false
replace_init_state: false
state_channels: 256
refine_block_rmsnorm: false
refine_block_layernorm: false
pt_qk_norm: false
norm_pt_block: false
refine_gaussian_multiple: 1
refine_residual_init_state: false
clamp_refine_max_scale: 3.0
clamp_min_scale: 1.0e-06
clamp_min_raw_opacities: -7
clamp_max_raw_opacities: 7
gaussian_head_multiple: 1
update_head_concat_img: false
update_head_layer_num: 2
update_head_act: gelu
update_head_final_act: identity
update_head_scale_mag: false
update_head_scalar_scale: true
update_head_scalar_scale_act: relu
# The only double-quoted scalar in this file; the value is the string `output`.
update_head_hidden_dim_matches: "output"
update_attn_proj_channels: 64
update_no_knn_attn: false
update_no_tran_block_norm: false
update_tran_block_act: gelu
multi_gaussian_scale_smaller: false
init_gaussian_multiple: 1
refine_condition_pt_feature: true
input_error_no_abs: false
reinit_gaussian_when_refine_multiple: false
refine_same_num_points: false
input_error_no_shuffle: false
input_error_cache_resnet_feature: false
input_error_view_pool_resnet_feature: false
input_error_global_pool_resnet_feature: false
init_state_wo_features: false
init_state_type: constant
init_state_scale: 0
pt_heads: 1
refine_with_mv_attn: false
refine_with_mv_attn_lowres: false
refine_no_mv_attn: false
mv_attn_conv_with_norm: false
refine_mv_shuffle_attn: false
refine_mv_attn_with_pos_enc: false
refine_shuffle_attn_no_norm: false
refine_mv_unimatch_attn: false
refine_knn_samples: 16
refine_multi_scale_pt: false
input_alpha: false
input_depth: false
input_depth_smooth_error: false
input_error: false
input_zero_gaussian: false
input_zero_state: false
input_zero_init_state: false
input_error_cross_attn: false
input_error_cross_attn_blocks: 1
input_error_cross_attn_with_mlp: false
input_error_radii_averaged: false
input_error_additional_cross_attn: false
input_error_num_intermediate_views: 8
input_error_mv_attn: false
input_error_mv_attn_blocks: 2
input_error_mv_attn_lowres: false
input_error_mv_attn_proj_channels: 0
input_error_lowres_attn_down_factor: 4
input_error_lowres_attn_pos_enc: false
input_error_mv_attn_swin: false
input_error_num_views: 0
input_error_remain_context: false
input_error_merge_remain_context: false
input_error_warp_remain_context: false
input_error_random_num_remain_context: false
input_error_num_remain_context_test: 0
input_error_warp_input_view: false
window_local_refine: false
window_global_refine: false
window_local_global_refine: false
update_window_size: 0
local_gaussian_render: false
input_error_half_res: false
# `input_gradient` is enabled while `input_error` above is false.
input_gradient: true
input_gradient_log: false
input_gradient_log_clip_deltas: 0.001
input_gradient_scale: 1.0
gradient_update_scale: 1.0
input_gradient_with_ssim_loss: true
input_gradient_same_loss: false
scale_residual_grads: false
# Min/max pair: 1 and 6.
train_min_refine: 1
train_max_refine: 6
local_global_update: false
num_global_update: 0
train_global_update_only: false
random_update_with_size: false
ptv3: false
ptv3_grid_size: 0.1
use_amp: true
pt_head_amp: true
pt_update_amp: true
use_checkpointing: false
recurrent_use_checkpointing: false
debug_refine_update_module: true
debug_refine_mlp: false
debug_refine_mlp_layers: 0
debug_refine_mlp_fixed_init: false
input_gradient_normalize: true
input_gradient_normalize_type: adam
input_normalize_state: false
input_normalize_gaussians: false
predict_state_scale: true
opt_scales_before_act: false
scale_initial_opacities: 1.0
sh_d: 16
local_prune_zero_radii: false
local_prune_low_weights: false
local_prune_low_weights_thresh: -1
update_only_nonzero_grad: true
# `experimental_run` is false; whether the `experimental_*` maps below are
# read in that case is not visible from this file.
experimental_run: false
experimental_update:
_base: true
_means: true
_scales: true
_quats: true
_opacities: true
_sh0: true
_shN: true
experimental_use_grads: false
experimental_use_norm_grads:
_base: false
_means: false
_scales: false
_quats: false
_opacities: false
_sh0: false
_shN: false
# Per-group values; note `_opacities` precedes `_quats` here, unlike the other
# per-group maps (mapping order carries no meaning in YAML).
experimental_lr:
_base: 1
_means: 0.00016
_scales: 0.005
_opacities: 0.05
_quats: 0.001
_sh0: 0.0025
_shN: 0.000125
sample_init_gaussians: 0
use_time_encoding: false
time_encoding_max_steps: 2000
# Decoder selection (`name: gsplat`), followed by trainer-level switches and
# an `initializer` map of network-size settings.
# NOTE(review): indentation is missing in this copy; where the `decoder` map
# ends and which parent owns `initializer` cannot be determined from here —
# confirm against the original file.
decoder:
name: gsplat
use_covariances: false
use_fsdp: false
# `train_scene_init` is false and `train_scene_opt` is true.
train_scene_init: false
train_scene_opt: true
num_update_steps: 4
# All three batch-size keys are -1.
iter_batch_size: -1
iter_batch_size_min: -1
iter_batch_size_max: -1
initializer:
num_depth_candidates: 128
costvolume_unet_feat_dim: 128
costvolume_unet_channel_mult:
- 1
- 1
- 1
costvolume_unet_attn_res:
- 4
gaussians_per_pixel: 1
depth_unet_feat_dim: 32
depth_unet_attn_res:
- 16
# Five entries here, versus three for `costvolume_unet_channel_mult` above.
depth_unet_channel_mult:
- 1
- 1
- 1
- 1
- 1
shim_patch_size: 16
# Test-time configuration: a `postprocessing` map, followed by evaluation and
# output-saving switches.
# NOTE(review): indentation is missing in this copy; the `postprocessing` map
# presumably ends at its `name: none` key — confirm against the original file.
test:
postprocessing:
steps: 2000
compute_metrics_every: 100
# Per-group values keyed by the seven parameter-group names; all 1 here.
lr_data:
_base: 1
_means: 1
_scales: 1
_opacities: 1
_quats: 1
_sh0: 1
_shN: 1
scheduler: null
scheduler_warm_up_ratio: 0.01
# Dotted Python path of the config class; presumably resolved by the
# consumer's config loader — confirm.
__target__: src.scene_trainer.postprocessing.NoPostProcessCfg
name: none
output_path: null
compute_scores: true
# Short leaf list kept in flow style, with a space after each comma.
compute_scores_metrics: [psnr, ssim, lpips]
eval_time_skip_steps: 0
eval_initialization: true
# Output-saving switches; all false in this configuration.
save_render_image: false
save_gt_image: false
save_render_depth: false
save_gt_depth: false
save_error_image: false
save_error_depth: false
save_video: false
save_depth: false
save_depth_npy: false
save_depth_concat_img: false
save_gaussian: false
save_poses: false
no_align_to_view: false
save_point_cloud: false
render_chunk_size: null
# NOTE(review): key is spelled `stablize_camera`; it is a key the consumer
# reads, so any rename must be coordinated with the consumer's schema.
stablize_camera: false
stab_camera_kernel: 50
eval_context_views: false
inference_window_size: null
profile_model: false
save_colmap_train_test_views: false
ori_colmap_data_path: null
adam_optimizer_step: 0
save_at_iters: null
# Two parallel four-element lists; presumably paired element-wise (frequency
# N applies from step M onward) — TODO confirm with the consumer.
save_every_freq:
- 1
- 10
- 100
- 500
save_every_steps:
- 0
- 10
- 100
- 1000
skip_if_outputs_exist: false
dec_chunk_size: 30
# Weights & Biases logging settings, followed by the run `mode`.
wandb:
project: ablation-dl3dv-8views
# Literal value `placeholder`; presumably meant to be overridden — confirm.
entity: placeholder
name: dl3dv
mode: online
id: null
notes: ''
tags:
- dl3dv
- 270x480
# NOTE(review): second `mode` key. Presumably this one is top-level (run mode)
# while the earlier `mode: online` belongs to `wandb`; with the indentation
# missing in this copy the two collide — confirm against the original file.
mode: train
# Data loader settings for three stages (train, test, val). Each stage sets
# num_workers, persistent_workers, batch_size and its own seed.
# NOTE(review): indentation is missing in this copy; the per-stage grouping is
# inferred from the repeating key pattern — confirm against the original file.
data_loader:
train:
num_workers: 10
persistent_workers: true
batch_size: 1
seed: 1234
test:
num_workers: 4
# Only the test stage sets persistent_workers to false.
persistent_workers: false
batch_size: 1
seed: 2345
val:
num_workers: 1
persistent_workers: true
batch_size: 1
seed: 3456
# Meta-optimizer settings: learning rates, warm-up and weight decay.
meta_optimizer:
lr: 0.0001
# Both extra learning rates are 0.0.
lr_monodepth: 0.0
lr_depth: 0.0
# NOTE(review): both `warm_up_steps` and `warm_up_ratio` are set; which one
# takes precedence is not visible from this file — confirm with the consumer.
warm_up_steps: 2000
weight_decay: 0.01
warm_up_ratio: 0.01
adamw_8bit: false
# Checkpoint saving/loading settings.
# NOTE(review): indentation is missing in this copy; the interpolation below
# refers to `checkpointing.pretrained_model`, which indicates these keys live
# under `checkpointing` — confirm against the original file.
checkpointing:
load: null
every_n_train_steps: 1000
save_top_k: 5
# Relative path to the checkpoint used as the pretrained model.
pretrained_model: checkpoints/optgs/unified-dl3dv-8views/init/checkpoints/epoch_20-step_100000.ckpt
# Interpolation that applies a `checkpoint_rel_dir` resolver to the
# `pretrained_model` value above; the resolver is defined outside this file.
pretrained_model_rel_dir: ${checkpoint_rel_dir:${checkpointing.pretrained_model}}
pretrained_monodepth: null
pretrained_mvdepth: null
pretrained_depth: null
pretrained_scale_predictor: null
pretrained_depth_teacher: null
no_strict_load: true
resume: false
no_resume_upsampler: false
partial_load: false
# Listed once: the original repeated this key on two adjacent lines with the
# same value, and duplicate mapping keys are invalid YAML.
freeze_mono_vit: false
resume_update_module: null
# Training-loop settings: logging/evaluation cadence, auxiliary loss weights,
# and the replay-buffer configuration.
# NOTE(review): indentation is missing in this copy; the keys after
# `replay_buffer_cfg` presumably belong to that nested map — confirm against
# the original file.
train:
depth_mode: null
extended_visualization: false
print_log_every_n_steps: 100
eval_model_every_n_val: 2
eval_data_length: 999999
eval_deterministic: false
eval_time_skip_steps: 3
eval_save_model: true
l1_loss: true
intermediate_loss_weight: 0.9
no_viz_video: false
eval_depth: false
forward_depth_only: false
train_ignore_large_loss: 0.0
no_log_projections: true
no_log_video: true
# Every `*_loss_weight` key from here to `img_warp_loss_weight` is 0.0.
depth_loss_weight: 0.0
log_depth_loss: true
depth_smooth_loss_weight: 0.0
depth_smooth_loss_nonorm: false
depth_smooth_loss_weight_nvs: 0.0
monodepth_loss_weight: 0.0
depth_teacher_loss_weight: 0.0
viz_depth_teacher: false
eval_render_depth: false
render_depth_loss_weight: 0.0
viz_render_depth: false
use_gt_depth_range: false
depth_range_from_disparity: false
max_disparity: 128.0
min_disparity: 4.0
img_warp_loss_weight: 0.0
warp_loss_start_step: 5000
# Both input-view and target-view losses are enabled.
loss_on_input_views: true
loss_on_target_views: true
loss_on_input_views_num: 4
train_window_size: null
half_res_lpips_loss: false
viz_depth_separate: false
use_replay_buffer: true
replay_buffer_cfg:
capacity: 20
sample_batch_size: 1
# Three probabilities in [0, 1].
sample_prob: 0.7
insert_prob: 0.99
return_prob: 0.99
simulate_ahead: true
simulate_ahead_min_steps: 1
simulate_ahead_max_steps: 50
simulate_ahead_grow: 10000
max_t: null
push_only_if_not_full: false
# Seed value, followed by the meta-trainer settings.
# NOTE(review): presumably a top-level seed, separate from the per-stage
# data-loader seeds earlier in the file — confirm against the original file.
seed: 111123
meta_trainer:
max_steps: 100000
# Fractional value (0.25); how the consumer interprets it is not visible here.
val_check_interval: 0.25
gradient_clip_val: 0.5
num_sanity_val_steps: 2
eval_index: null
limit_test_batches: 1.0
limit_train_batches: 1.0
num_nodes: 1
# Output directory, built from four path components, followed by two flags.
# NOTE(review): the `!!python/object/apply:` tag is Python-specific and asks
# the loader to call `src.misc.io.CustomPath` with the listed components. Safe
# loaders (e.g. PyYAML `safe_load`) reject it, and loaders that accept it
# should only be used on trusted files.
output_dir: !!python/object/apply:src.misc.io.CustomPath
- checkpoints
- rebuttal
- dl3dv-8views
- submitted
use_plugins: false
log_slurm_id: true