AmandineBtto committed on
Commit
689130a
·
1 Parent(s): ac36c41

Adding NeRAF weights

Browse files
Files changed (49) hide show
  1. RAF/EmptyRoom_NeRAF/.DS_Store +0 -0
  2. RAF/EmptyRoom_NeRAF/NeRAF/.DS_Store +0 -0
  3. RAF/EmptyRoom_NeRAF/NeRAF/2024-10-10_041356/.DS_Store +0 -0
  4. RAF/EmptyRoom_NeRAF/NeRAF/2024-10-10_041356/config.yml +295 -0
  5. RAF/EmptyRoom_NeRAF/NeRAF/2024-10-10_041356/dataparser_transforms.json +23 -0
  6. RAF/EmptyRoom_NeRAF/NeRAF/2024-10-10_041356/nerfstudio_models/step-000090000.ckpt +3 -0
  7. RAF/FurnishedRoom_NeRAF/.DS_Store +0 -0
  8. RAF/FurnishedRoom_NeRAF/NeRAF/.DS_Store +0 -0
  9. RAF/FurnishedRoom_NeRAF/NeRAF/2024-10-08_091734/.DS_Store +0 -0
  10. RAF/FurnishedRoom_NeRAF/NeRAF/2024-10-08_091734/config.yml +295 -0
  11. RAF/FurnishedRoom_NeRAF/NeRAF/2024-10-08_091734/dataparser_transforms.json +23 -0
  12. RAF/FurnishedRoom_NeRAF/NeRAF/2024-10-08_091734/nerfstudio_models/step-000070000.ckpt +3 -0
  13. README.md +37 -0
  14. SoundSpaces/apartment_1_NeRAF/.DS_Store +0 -0
  15. SoundSpaces/apartment_1_NeRAF/NeRAF/.DS_Store +0 -0
  16. SoundSpaces/apartment_1_NeRAF/NeRAF/2024-10-18_093105/.DS_Store +0 -0
  17. SoundSpaces/apartment_1_NeRAF/NeRAF/2024-10-18_093105/config.yml +294 -0
  18. SoundSpaces/apartment_1_NeRAF/NeRAF/2024-10-18_093105/dataparser_transforms.json +23 -0
  19. SoundSpaces/apartment_1_NeRAF/NeRAF/2024-10-18_093105/nerfstudio_models/step-000480000.ckpt +3 -0
  20. SoundSpaces/apartment_2_NeRAF/.DS_Store +0 -0
  21. SoundSpaces/apartment_2_NeRAF/NeRAF/.DS_Store +0 -0
  22. SoundSpaces/apartment_2_NeRAF/NeRAF/2024-10-13_131052/.DS_Store +0 -0
  23. SoundSpaces/apartment_2_NeRAF/NeRAF/2024-10-13_131052/config.yml +294 -0
  24. SoundSpaces/apartment_2_NeRAF/NeRAF/2024-10-13_131052/dataparser_transforms.json +23 -0
  25. SoundSpaces/apartment_2_NeRAF/NeRAF/2024-10-13_131052/nerfstudio_models/step-000150000.ckpt +3 -0
  26. SoundSpaces/frl_apartment_2_NeRAF/.DS_Store +0 -0
  27. SoundSpaces/frl_apartment_2_NeRAF/NeRAF/.DS_Store +0 -0
  28. SoundSpaces/frl_apartment_2_NeRAF/NeRAF/2024-10-18_133400/.DS_Store +0 -0
  29. SoundSpaces/frl_apartment_2_NeRAF/NeRAF/2024-10-18_133400/config.yml +294 -0
  30. SoundSpaces/frl_apartment_2_NeRAF/NeRAF/2024-10-18_133400/dataparser_transforms.json +23 -0
  31. SoundSpaces/frl_apartment_2_NeRAF/NeRAF/2024-10-18_133400/nerfstudio_models/step-000450000.ckpt +3 -0
  32. SoundSpaces/frl_apartment_4_NeRAF/.DS_Store +0 -0
  33. SoundSpaces/frl_apartment_4_NeRAF/NeRAF/.DS_Store +0 -0
  34. SoundSpaces/frl_apartment_4_NeRAF/NeRAF/2024-10-20_105001/.DS_Store +0 -0
  35. SoundSpaces/frl_apartment_4_NeRAF/NeRAF/2024-10-20_105001/config.yml +294 -0
  36. SoundSpaces/frl_apartment_4_NeRAF/NeRAF/2024-10-20_105001/dataparser_transforms.json +23 -0
  37. SoundSpaces/frl_apartment_4_NeRAF/NeRAF/2024-10-20_105001/nerfstudio_models/step-000170000.ckpt +3 -0
  38. SoundSpaces/office_4_NeRAF/.DS_Store +0 -0
  39. SoundSpaces/office_4_NeRAF/NeRAF/.DS_Store +0 -0
  40. SoundSpaces/office_4_NeRAF/NeRAF/2024-10-11_101120/.DS_Store +0 -0
  41. SoundSpaces/office_4_NeRAF/NeRAF/2024-10-11_101120/config.yml +294 -0
  42. SoundSpaces/office_4_NeRAF/NeRAF/2024-10-11_101120/dataparser_transforms.json +23 -0
  43. SoundSpaces/office_4_NeRAF/NeRAF/2024-10-11_101120/nerfstudio_models/step-000460000.ckpt +3 -0
  44. SoundSpaces/room_2_NeRAF/.DS_Store +0 -0
  45. SoundSpaces/room_2_NeRAF/NeRAF/.DS_Store +0 -0
  46. SoundSpaces/room_2_NeRAF/NeRAF/2024-10-14_045651/.DS_Store +0 -0
  47. SoundSpaces/room_2_NeRAF/NeRAF/2024-10-14_045651/config.yml +294 -0
  48. SoundSpaces/room_2_NeRAF/NeRAF/2024-10-14_045651/dataparser_transforms.json +23 -0
  49. SoundSpaces/room_2_NeRAF/NeRAF/2024-10-14_045651/nerfstudio_models/step-000160000.ckpt +3 -0
RAF/EmptyRoom_NeRAF/.DS_Store ADDED
Binary file (6.15 kB). View file
 
RAF/EmptyRoom_NeRAF/NeRAF/.DS_Store ADDED
Binary file (6.15 kB). View file
 
RAF/EmptyRoom_NeRAF/NeRAF/2024-10-10_041356/.DS_Store ADDED
Binary file (6.15 kB). View file
 
RAF/EmptyRoom_NeRAF/NeRAF/2024-10-10_041356/config.yml ADDED
@@ -0,0 +1,295 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ !!python/object:nerfstudio.engine.trainer.TrainerConfig
2
+ _target: !!python/name:nerfstudio.engine.trainer.Trainer ''
3
+ data: &id004 !!python/object/apply:pathlib.PosixPath
4
+ - ../
5
+ - data
6
+ - RAF
7
+ - EmptyRoom
8
+ experiment_name: EmptyRoom_NeRAF
9
+ gradient_accumulation_steps: {}
10
+ load_checkpoint: null
11
+ load_config: null
12
+ load_dir: null
13
+ load_scheduler: true
14
+ load_step: null
15
+ log_gradients: false
16
+ logging: !!python/object:nerfstudio.configs.base_config.LoggingConfig
17
+ local_writer: !!python/object:nerfstudio.configs.base_config.LocalWriterConfig
18
+ _target: !!python/name:nerfstudio.utils.writer.LocalWriter ''
19
+ enable: true
20
+ max_log_size: 10
21
+ stats_to_track: !!python/tuple
22
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
23
+ - Train Iter (time)
24
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
25
+ - Train Rays / Sec
26
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
27
+ - Test PSNR
28
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
29
+ - Vis Rays / Sec
30
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
31
+ - Test Rays / Sec
32
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
33
+ - ETA (time)
34
+ max_buffer_size: 20
35
+ profiler: basic
36
+ relative_log_dir: !!python/object/apply:pathlib.PosixPath []
37
+ steps_per_log: 10
38
+ machine: !!python/object:nerfstudio.configs.base_config.MachineConfig
39
+ device_type: cuda
40
+ dist_url: auto
41
+ machine_rank: 0
42
+ num_devices: 1
43
+ num_machines: 1
44
+ seed: 42
45
+ max_num_iterations: 300001
46
+ method_name: NeRAF
47
+ mixed_precision: true
48
+ optimizers:
49
+ audio_fields:
50
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
51
+ _target: &id001 !!python/name:torch.optim.adam.Adam ''
52
+ eps: 1.0e-15
53
+ lr: 0.0001
54
+ max_norm: null
55
+ weight_decay: 0
56
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
57
+ _target: &id002 !!python/name:nerfstudio.engine.schedulers.ExponentialDecayScheduler ''
58
+ lr_final: 1.0e-08
59
+ lr_pre_warmup: 1.0e-08
60
+ max_steps: 1002000
61
+ ramp: cosine
62
+ warmup_steps: 2000
63
+ camera_opt:
64
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
65
+ _target: *id001
66
+ eps: 1.0e-15
67
+ lr: 0.001
68
+ max_norm: null
69
+ weight_decay: 0
70
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
71
+ _target: *id002
72
+ lr_final: 0.0001
73
+ lr_pre_warmup: 1.0e-08
74
+ max_steps: 5000
75
+ ramp: cosine
76
+ warmup_steps: 0
77
+ fields:
78
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
79
+ _target: *id001
80
+ eps: 1.0e-15
81
+ lr: 0.01
82
+ max_norm: null
83
+ weight_decay: 0
84
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
85
+ _target: *id002
86
+ lr_final: 0.0001
87
+ lr_pre_warmup: 1.0e-08
88
+ max_steps: 200000
89
+ ramp: cosine
90
+ warmup_steps: 0
91
+ proposal_networks:
92
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
93
+ _target: *id001
94
+ eps: 1.0e-15
95
+ lr: 0.01
96
+ max_norm: null
97
+ weight_decay: 0
98
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
99
+ _target: *id002
100
+ lr_final: 0.0001
101
+ lr_pre_warmup: 1.0e-08
102
+ max_steps: 200000
103
+ ramp: cosine
104
+ warmup_steps: 0
105
+ output_dir: !!python/object/apply:pathlib.PosixPath
106
+ - ./
107
+ - outputs
108
+ pipeline: !!python/object:NeRAF.NeRAF_pipeline.NeRAFPipelineConfig
109
+ _target: !!python/name:NeRAF.NeRAF_pipeline.NeRAFPipeline ''
110
+ audio_datamanager: !!python/object:NeRAF.NeRAF_datamanager.RAFDataManagerConfig
111
+ _target: !!python/name:NeRAF.NeRAF_datamanager.RAFDataManager ''
112
+ collate_fn: &id003 !!python/name:nerfstudio.data.utils.nerfstudio_collate.nerfstudio_collate ''
113
+ data: null
114
+ dataparser: !!python/object:NeRAF.NeRAF_dataparser.RAFDataParserConfig
115
+ _target: !!python/name:NeRAF.NeRAF_dataparser.RAFDataParser ''
116
+ data: !!python/object/apply:pathlib.PosixPath []
117
+ eval_num_rays_per_batch: 2048
118
+ fs: 48000
119
+ hop_len: 256
120
+ images_on_gpu: false
121
+ masks_on_gpu: false
122
+ max_len: 0.32
123
+ test_mode: test
124
+ train_num_rays_per_batch: 2048
125
+ audio_model: !!python/object:NeRAF.NeRAF_model.NeRAFAudioModelConfig
126
+ N_features: 1024
127
+ N_freq_stft: 257
128
+ W_field: 512
129
+ _target: !!python/name:NeRAF.NeRAF_model.NeRAFAudioModel ''
130
+ collider_params:
131
+ far_plane: 6.0
132
+ near_plane: 2.0
133
+ criterion: SC+SLMSE
134
+ dataset: RAF
135
+ enable_collider: true
136
+ eval_num_rays_per_chunk: 4096
137
+ fs: 48000
138
+ grid_step: 0.0078125
139
+ hop_len: 128
140
+ loss_coefficients:
141
+ rgb_loss_coarse: 1.0
142
+ rgb_loss_fine: 1.0
143
+ loss_factor: 0.001
144
+ max_len: 0.32
145
+ prompt: null
146
+ use_grid: true
147
+ use_multiple_viewing_directions: true
148
+ win_len: 512
149
+ datamanager: !!python/object:nerfstudio.data.datamanagers.parallel_datamanager.ParallelDataManagerConfig
150
+ _target: !!python/name:nerfstudio.data.datamanagers.parallel_datamanager.ParallelDataManager ''
151
+ camera_optimizer: null
152
+ camera_res_scale_factor: 1.0
153
+ collate_fn: *id003
154
+ data: *id004
155
+ dataparser: !!python/object:nerfstudio.data.dataparsers.nerfstudio_dataparser.NerfstudioDataParserConfig
156
+ _target: !!python/name:nerfstudio.data.dataparsers.nerfstudio_dataparser.Nerfstudio ''
157
+ auto_scale_poses: true
158
+ center_method: poses
159
+ data: !!python/object/apply:pathlib.PosixPath []
160
+ depth_unit_scale_factor: 0.001
161
+ downscale_factor: null
162
+ eval_interval: 8
163
+ eval_mode: fraction
164
+ load_3D_points: false
165
+ mask_color: null
166
+ orientation_method: up
167
+ scale_factor: 1.0
168
+ scene_scale: 1.0
169
+ train_split_fraction: 0.9
170
+ eval_image_indices: !!python/tuple
171
+ - 0
172
+ eval_num_images_to_sample_from: -1
173
+ eval_num_rays_per_batch: 4096
174
+ eval_num_times_to_repeat_images: -1
175
+ images_on_gpu: true
176
+ masks_on_gpu: true
177
+ max_thread_workers: null
178
+ num_processes: 1
179
+ patch_size: 1
180
+ pixel_sampler: !!python/object:nerfstudio.data.pixel_samplers.PixelSamplerConfig
181
+ _target: !!python/name:nerfstudio.data.pixel_samplers.PixelSampler ''
182
+ fisheye_crop_radius: null
183
+ ignore_mask: false
184
+ is_equirectangular: false
185
+ keep_full_image: false
186
+ max_num_iterations: 100
187
+ num_rays_per_batch: 4096
188
+ rejection_sample_mask: true
189
+ queue_size: 2
190
+ train_num_images_to_sample_from: -1
191
+ train_num_rays_per_batch: 4096
192
+ train_num_times_to_repeat_images: -1
193
+ model: !!python/object:nerfstudio.models.base_model.ModelConfig
194
+ _target: !!python/name:nerfstudio.models.base_model.Model ''
195
+ collider_params:
196
+ far_plane: 6.0
197
+ near_plane: 2.0
198
+ enable_collider: true
199
+ eval_num_rays_per_chunk: 4096
200
+ loss_coefficients:
201
+ rgb_loss_coarse: 1.0
202
+ rgb_loss_fine: 1.0
203
+ prompt: null
204
+ save_eval_audio_path: null
205
+ start_step_audio: 2000
206
+ vision_model: !!python/object:NeRAF.NeRAF_model.NeRAFVisionModelConfig
207
+ _target: !!python/name:NeRAF.NeRAF_model.NeRAFVisionModel ''
208
+ appearance_embed_dim: 32
209
+ average_init_density: 0.01
210
+ background_color: last_sample
211
+ base_res: 16
212
+ camera_optimizer: !!python/object:nerfstudio.cameras.camera_optimizers.CameraOptimizerConfig
213
+ _target: !!python/name:nerfstudio.cameras.camera_optimizers.CameraOptimizer ''
214
+ mode: SO3xR3
215
+ optimizer: null
216
+ rot_l2_penalty: 0.001
217
+ scheduler: null
218
+ trans_l2_penalty: 0.01
219
+ collider_params:
220
+ far_plane: 6.0
221
+ near_plane: 2.0
222
+ disable_scene_contraction: false
223
+ distortion_loss_mult: 0.002
224
+ enable_collider: true
225
+ eval_num_rays_per_chunk: 32768
226
+ far_plane: 1000.0
227
+ features_per_level: 2
228
+ hidden_dim: 64
229
+ hidden_dim_color: 64
230
+ hidden_dim_transient: 64
231
+ implementation: tcnn
232
+ interlevel_loss_mult: 1.0
233
+ log2_hashmap_size: 19
234
+ loss_coefficients:
235
+ rgb_loss_coarse: 1.0
236
+ rgb_loss_fine: 1.0
237
+ max_res: 2048
238
+ near_plane: 0.05
239
+ num_levels: 16
240
+ num_nerf_samples_per_ray: 48
241
+ num_proposal_iterations: 2
242
+ num_proposal_samples_per_ray: !!python/tuple
243
+ - 256
244
+ - 96
245
+ orientation_loss_mult: 0.0001
246
+ pred_normal_loss_mult: 0.001
247
+ predict_normals: false
248
+ prompt: null
249
+ proposal_initial_sampler: piecewise
250
+ proposal_net_args_list:
251
+ - hidden_dim: 16
252
+ log2_hashmap_size: 17
253
+ max_res: 128
254
+ num_levels: 5
255
+ use_linear: false
256
+ - hidden_dim: 16
257
+ log2_hashmap_size: 17
258
+ max_res: 256
259
+ num_levels: 5
260
+ use_linear: false
261
+ proposal_update_every: 5
262
+ proposal_warmup: 5000
263
+ proposal_weights_anneal_max_num_iters: 1000
264
+ proposal_weights_anneal_slope: 10.0
265
+ use_appearance_embedding: true
266
+ use_average_appearance_embedding: true
267
+ use_gradient_scaling: false
268
+ use_proposal_weight_anneal: true
269
+ use_same_proposal_network: false
270
+ use_single_jitter: true
271
+ project_name: nerfstudio-project
272
+ prompt: null
273
+ relative_model_dir: !!python/object/apply:pathlib.PosixPath
274
+ - nerfstudio_models
275
+ save_only_latest_checkpoint: false
276
+ steps_per_eval_all_images: 10000
277
+ steps_per_eval_batch: 10000
278
+ steps_per_eval_image: 10000
279
+ steps_per_save: 10000
280
+ timestamp: 2024-10-10_041356
281
+ use_grad_scaler: false
282
+ viewer: !!python/object:nerfstudio.configs.base_config.ViewerConfig
283
+ camera_frustum_scale: 0.1
284
+ default_composite_depth: true
285
+ image_format: jpeg
286
+ jpeg_quality: 75
287
+ make_share_url: false
288
+ max_num_display_images: 512
289
+ num_rays_per_chunk: 32768
290
+ quit_on_train_completion: false
291
+ relative_log_filename: viewer_log_filename.txt
292
+ websocket_host: 0.0.0.0
293
+ websocket_port: null
294
+ websocket_port_default: 7007
295
+ vis: tensorboard
RAF/EmptyRoom_NeRAF/NeRAF/2024-10-10_041356/dataparser_transforms.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "transform": [
3
+ [
4
+ 0.9952307343482971,
5
+ -0.002114448929205537,
6
+ 0.09752625972032547,
7
+ 10.1349458694458
8
+ ],
9
+ [
10
+ -0.002114448929205537,
11
+ 0.9990625381469727,
12
+ 0.04323790222406387,
13
+ 3.0788350105285645
14
+ ],
15
+ [
16
+ -0.09752625972032547,
17
+ -0.04323790222406387,
18
+ 0.9942932724952698,
19
+ -0.6873995065689087
20
+ ]
21
+ ],
22
+ "scale": 0.05830662043845625
23
+ }
RAF/EmptyRoom_NeRAF/NeRAF/2024-10-10_041356/nerfstudio_models/step-000090000.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:990aedc1d456a4f3e6ffecaafe47c5cfd85a2bbd1d9f259ef84fc126c1cb9fb5
3
+ size 783247931
RAF/FurnishedRoom_NeRAF/.DS_Store ADDED
Binary file (6.15 kB). View file
 
RAF/FurnishedRoom_NeRAF/NeRAF/.DS_Store ADDED
Binary file (6.15 kB). View file
 
RAF/FurnishedRoom_NeRAF/NeRAF/2024-10-08_091734/.DS_Store ADDED
Binary file (6.15 kB). View file
 
RAF/FurnishedRoom_NeRAF/NeRAF/2024-10-08_091734/config.yml ADDED
@@ -0,0 +1,295 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ !!python/object:nerfstudio.engine.trainer.TrainerConfig
2
+ _target: !!python/name:nerfstudio.engine.trainer.Trainer ''
3
+ data: &id004 !!python/object/apply:pathlib.PosixPath
4
+ - ../
5
+ - data
6
+ - RAF
7
+ - FurnishedRoom
8
+ experiment_name: FurnishedRoom_NeRAF
9
+ gradient_accumulation_steps: {}
10
+ load_checkpoint: null
11
+ load_config: null
12
+ load_dir: null
13
+ load_scheduler: true
14
+ load_step: null
15
+ log_gradients: false
16
+ logging: !!python/object:nerfstudio.configs.base_config.LoggingConfig
17
+ local_writer: !!python/object:nerfstudio.configs.base_config.LocalWriterConfig
18
+ _target: !!python/name:nerfstudio.utils.writer.LocalWriter ''
19
+ enable: true
20
+ max_log_size: 10
21
+ stats_to_track: !!python/tuple
22
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
23
+ - Train Iter (time)
24
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
25
+ - Train Rays / Sec
26
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
27
+ - Test PSNR
28
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
29
+ - Vis Rays / Sec
30
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
31
+ - Test Rays / Sec
32
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
33
+ - ETA (time)
34
+ max_buffer_size: 20
35
+ profiler: basic
36
+ relative_log_dir: !!python/object/apply:pathlib.PosixPath []
37
+ steps_per_log: 10
38
+ machine: !!python/object:nerfstudio.configs.base_config.MachineConfig
39
+ device_type: cuda
40
+ dist_url: auto
41
+ machine_rank: 0
42
+ num_devices: 1
43
+ num_machines: 1
44
+ seed: 42
45
+ max_num_iterations: 300001
46
+ method_name: NeRAF
47
+ mixed_precision: true
48
+ optimizers:
49
+ audio_fields:
50
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
51
+ _target: &id001 !!python/name:torch.optim.adam.Adam ''
52
+ eps: 1.0e-15
53
+ lr: 0.0001
54
+ max_norm: null
55
+ weight_decay: 0
56
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
57
+ _target: &id002 !!python/name:nerfstudio.engine.schedulers.ExponentialDecayScheduler ''
58
+ lr_final: 1.0e-08
59
+ lr_pre_warmup: 1.0e-08
60
+ max_steps: 1002000
61
+ ramp: cosine
62
+ warmup_steps: 2000
63
+ camera_opt:
64
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
65
+ _target: *id001
66
+ eps: 1.0e-15
67
+ lr: 0.001
68
+ max_norm: null
69
+ weight_decay: 0
70
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
71
+ _target: *id002
72
+ lr_final: 0.0001
73
+ lr_pre_warmup: 1.0e-08
74
+ max_steps: 5000
75
+ ramp: cosine
76
+ warmup_steps: 0
77
+ fields:
78
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
79
+ _target: *id001
80
+ eps: 1.0e-15
81
+ lr: 0.01
82
+ max_norm: null
83
+ weight_decay: 0
84
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
85
+ _target: *id002
86
+ lr_final: 0.0001
87
+ lr_pre_warmup: 1.0e-08
88
+ max_steps: 200000
89
+ ramp: cosine
90
+ warmup_steps: 0
91
+ proposal_networks:
92
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
93
+ _target: *id001
94
+ eps: 1.0e-15
95
+ lr: 0.01
96
+ max_norm: null
97
+ weight_decay: 0
98
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
99
+ _target: *id002
100
+ lr_final: 0.0001
101
+ lr_pre_warmup: 1.0e-08
102
+ max_steps: 200000
103
+ ramp: cosine
104
+ warmup_steps: 0
105
+ output_dir: !!python/object/apply:pathlib.PosixPath
106
+ - ./
107
+ - outputs
108
+ pipeline: !!python/object:NeRAF.NeRAF_pipeline.NeRAFPipelineConfig
109
+ _target: !!python/name:NeRAF.NeRAF_pipeline.NeRAFPipeline ''
110
+ audio_datamanager: !!python/object:NeRAF.NeRAF_datamanager.RAFDataManagerConfig
111
+ _target: !!python/name:NeRAF.NeRAF_datamanager.RAFDataManager ''
112
+ collate_fn: &id003 !!python/name:nerfstudio.data.utils.nerfstudio_collate.nerfstudio_collate ''
113
+ data: null
114
+ dataparser: !!python/object:NeRAF.NeRAF_dataparser.RAFDataParserConfig
115
+ _target: !!python/name:NeRAF.NeRAF_dataparser.RAFDataParser ''
116
+ data: !!python/object/apply:pathlib.PosixPath []
117
+ eval_num_rays_per_batch: 2048
118
+ fs: 48000
119
+ hop_len: 256
120
+ images_on_gpu: false
121
+ masks_on_gpu: false
122
+ max_len: 0.32
123
+ test_mode: test
124
+ train_num_rays_per_batch: 2048
125
+ audio_model: !!python/object:NeRAF.NeRAF_model.NeRAFAudioModelConfig
126
+ N_features: 1024
127
+ N_freq_stft: 257
128
+ W_field: 512
129
+ _target: !!python/name:NeRAF.NeRAF_model.NeRAFAudioModel ''
130
+ collider_params:
131
+ far_plane: 6.0
132
+ near_plane: 2.0
133
+ criterion: SC+SLMSE
134
+ dataset: RAF
135
+ enable_collider: true
136
+ eval_num_rays_per_chunk: 4096
137
+ fs: 48000
138
+ grid_step: 0.0078125
139
+ hop_len: 128
140
+ loss_coefficients:
141
+ rgb_loss_coarse: 1.0
142
+ rgb_loss_fine: 1.0
143
+ loss_factor: 0.001
144
+ max_len: 0.32
145
+ prompt: null
146
+ use_grid: true
147
+ use_multiple_viewing_directions: true
148
+ win_len: 512
149
+ datamanager: !!python/object:nerfstudio.data.datamanagers.parallel_datamanager.ParallelDataManagerConfig
150
+ _target: !!python/name:nerfstudio.data.datamanagers.parallel_datamanager.ParallelDataManager ''
151
+ camera_optimizer: null
152
+ camera_res_scale_factor: 1.0
153
+ collate_fn: *id003
154
+ data: *id004
155
+ dataparser: !!python/object:nerfstudio.data.dataparsers.nerfstudio_dataparser.NerfstudioDataParserConfig
156
+ _target: !!python/name:nerfstudio.data.dataparsers.nerfstudio_dataparser.Nerfstudio ''
157
+ auto_scale_poses: true
158
+ center_method: poses
159
+ data: !!python/object/apply:pathlib.PosixPath []
160
+ depth_unit_scale_factor: 0.001
161
+ downscale_factor: null
162
+ eval_interval: 8
163
+ eval_mode: fraction
164
+ load_3D_points: false
165
+ mask_color: null
166
+ orientation_method: up
167
+ scale_factor: 1.0
168
+ scene_scale: 1.0
169
+ train_split_fraction: 0.9
170
+ eval_image_indices: !!python/tuple
171
+ - 0
172
+ eval_num_images_to_sample_from: -1
173
+ eval_num_rays_per_batch: 4096
174
+ eval_num_times_to_repeat_images: -1
175
+ images_on_gpu: true
176
+ masks_on_gpu: true
177
+ max_thread_workers: null
178
+ num_processes: 1
179
+ patch_size: 1
180
+ pixel_sampler: !!python/object:nerfstudio.data.pixel_samplers.PixelSamplerConfig
181
+ _target: !!python/name:nerfstudio.data.pixel_samplers.PixelSampler ''
182
+ fisheye_crop_radius: null
183
+ ignore_mask: false
184
+ is_equirectangular: false
185
+ keep_full_image: false
186
+ max_num_iterations: 100
187
+ num_rays_per_batch: 4096
188
+ rejection_sample_mask: true
189
+ queue_size: 2
190
+ train_num_images_to_sample_from: -1
191
+ train_num_rays_per_batch: 4096
192
+ train_num_times_to_repeat_images: -1
193
+ model: !!python/object:nerfstudio.models.base_model.ModelConfig
194
+ _target: !!python/name:nerfstudio.models.base_model.Model ''
195
+ collider_params:
196
+ far_plane: 6.0
197
+ near_plane: 2.0
198
+ enable_collider: true
199
+ eval_num_rays_per_chunk: 4096
200
+ loss_coefficients:
201
+ rgb_loss_coarse: 1.0
202
+ rgb_loss_fine: 1.0
203
+ prompt: null
204
+ save_eval_audio_path: null
205
+ start_step_audio: 2000
206
+ vision_model: !!python/object:NeRAF.NeRAF_model.NeRAFVisionModelConfig
207
+ _target: !!python/name:NeRAF.NeRAF_model.NeRAFVisionModel ''
208
+ appearance_embed_dim: 32
209
+ average_init_density: 0.01
210
+ background_color: last_sample
211
+ base_res: 16
212
+ camera_optimizer: !!python/object:nerfstudio.cameras.camera_optimizers.CameraOptimizerConfig
213
+ _target: !!python/name:nerfstudio.cameras.camera_optimizers.CameraOptimizer ''
214
+ mode: SO3xR3
215
+ optimizer: null
216
+ rot_l2_penalty: 0.001
217
+ scheduler: null
218
+ trans_l2_penalty: 0.01
219
+ collider_params:
220
+ far_plane: 6.0
221
+ near_plane: 2.0
222
+ disable_scene_contraction: false
223
+ distortion_loss_mult: 0.002
224
+ enable_collider: true
225
+ eval_num_rays_per_chunk: 32768
226
+ far_plane: 1000.0
227
+ features_per_level: 2
228
+ hidden_dim: 64
229
+ hidden_dim_color: 64
230
+ hidden_dim_transient: 64
231
+ implementation: tcnn
232
+ interlevel_loss_mult: 1.0
233
+ log2_hashmap_size: 19
234
+ loss_coefficients:
235
+ rgb_loss_coarse: 1.0
236
+ rgb_loss_fine: 1.0
237
+ max_res: 2048
238
+ near_plane: 0.05
239
+ num_levels: 16
240
+ num_nerf_samples_per_ray: 48
241
+ num_proposal_iterations: 2
242
+ num_proposal_samples_per_ray: !!python/tuple
243
+ - 256
244
+ - 96
245
+ orientation_loss_mult: 0.0001
246
+ pred_normal_loss_mult: 0.001
247
+ predict_normals: false
248
+ prompt: null
249
+ proposal_initial_sampler: piecewise
250
+ proposal_net_args_list:
251
+ - hidden_dim: 16
252
+ log2_hashmap_size: 17
253
+ max_res: 128
254
+ num_levels: 5
255
+ use_linear: false
256
+ - hidden_dim: 16
257
+ log2_hashmap_size: 17
258
+ max_res: 256
259
+ num_levels: 5
260
+ use_linear: false
261
+ proposal_update_every: 5
262
+ proposal_warmup: 5000
263
+ proposal_weights_anneal_max_num_iters: 1000
264
+ proposal_weights_anneal_slope: 10.0
265
+ use_appearance_embedding: true
266
+ use_average_appearance_embedding: true
267
+ use_gradient_scaling: false
268
+ use_proposal_weight_anneal: true
269
+ use_same_proposal_network: false
270
+ use_single_jitter: true
271
+ project_name: nerfstudio-project
272
+ prompt: null
273
+ relative_model_dir: !!python/object/apply:pathlib.PosixPath
274
+ - nerfstudio_models
275
+ save_only_latest_checkpoint: false
276
+ steps_per_eval_all_images: 10000
277
+ steps_per_eval_batch: 10000
278
+ steps_per_eval_image: 10000
279
+ steps_per_save: 10000
280
+ timestamp: 2024-10-08_091734
281
+ use_grad_scaler: false
282
+ viewer: !!python/object:nerfstudio.configs.base_config.ViewerConfig
283
+ camera_frustum_scale: 0.1
284
+ default_composite_depth: true
285
+ image_format: jpeg
286
+ jpeg_quality: 75
287
+ make_share_url: false
288
+ max_num_display_images: 512
289
+ num_rays_per_chunk: 32768
290
+ quit_on_train_completion: false
291
+ relative_log_filename: viewer_log_filename.txt
292
+ websocket_host: 0.0.0.0
293
+ websocket_port: null
294
+ websocket_port_default: 7007
295
+ vis: tensorboard
RAF/FurnishedRoom_NeRAF/NeRAF/2024-10-08_091734/dataparser_transforms.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "transform": [
3
+ [
4
+ 0.9999954104423523,
5
+ -2.209847116318997e-05,
6
+ 0.0030350869055837393,
7
+ 0.9352688193321228
8
+ ],
9
+ [
10
+ -2.209847116318997e-05,
11
+ 0.9998939633369446,
12
+ 0.01456119678914547,
13
+ 4.980982780456543
14
+ ],
15
+ [
16
+ -0.0030350869055837393,
17
+ -0.01456119678914547,
18
+ 0.9998893737792969,
19
+ 0.0385591983795166
20
+ ]
21
+ ],
22
+ "scale": 0.1115622692578588
23
+ }
RAF/FurnishedRoom_NeRAF/NeRAF/2024-10-08_091734/nerfstudio_models/step-000070000.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93c9a728c4051e826799d2ee156f9ec53d69f4288427c31882b4b61a602be227
3
+ size 782844283
README.md CHANGED
@@ -1,3 +1,40 @@
1
  ---
2
  license: cc-by-nc-sa-4.0
 
 
 
 
 
 
 
 
 
 
3
  ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
  license: cc-by-nc-sa-4.0
3
+ tags:
4
+ - audio-visual-learning
5
+ - neural-radiance-fields
6
+ - neural-acoustic-fields
7
+ - spatial-audio
8
+ - nerfstudio
9
+ - pytorch
10
+ datasets:
11
+ - RAF
12
+ - SoundSpaces
13
  ---
14
+
15
+ Official pretrained model weights for NeRAF from the paper: **"NeRAF: 3D Scene Infused Neural Radiance and Acoustic Fields"** (ICLR 2025).
16
+
17
+ This repository contains pretrained checkpoints for the RAF dataset and 6 SoundSpaces scenes.
18
+
19
+ For training, evaluation, and usage instructions, please see the official codebase:
20
+ 👉 https://github.com/AmandineBtto/NeRAF
21
+
22
+
23
+ You can download all weights using:
24
+
25
+ ```bash
26
+ huggingface-cli download AmandineBtto/NeRAF --local-dir weights/NeRAF
27
+ ```
28
+
29
+ If you use these weights, please cite:
30
+
31
+ ```
32
+ @inproceedings{
33
+ brunetto2025neraf,
34
+ title={Ne{RAF}: 3D Scene Infused Neural Radiance and Acoustic Fields},
35
+ author={Amandine Brunetto and Sascha Hornauer and Fabien Moutarde},
36
+ booktitle={The Thirteenth International Conference on Learning Representations},
37
+ year={2025},
38
+ url={https://openreview.net/forum?id=njvSBvtiwp}
39
+ }
40
+ ```
SoundSpaces/apartment_1_NeRAF/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/apartment_1_NeRAF/NeRAF/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/apartment_1_NeRAF/NeRAF/2024-10-18_093105/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/apartment_1_NeRAF/NeRAF/2024-10-18_093105/config.yml ADDED
@@ -0,0 +1,294 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ !!python/object:nerfstudio.engine.trainer.TrainerConfig
2
+ _target: !!python/name:nerfstudio.engine.trainer.Trainer ''
3
+ data: &id004 !!python/object/apply:pathlib.PosixPath
4
+ - ../
5
+ - data
6
+ - SoundSpaces
7
+ - apartment_1
8
+ experiment_name: apartment_1_NeRAF
9
+ gradient_accumulation_steps: {}
10
+ load_checkpoint: null
11
+ load_config: null
12
+ load_dir: null
13
+ load_scheduler: true
14
+ load_step: null
15
+ log_gradients: false
16
+ logging: !!python/object:nerfstudio.configs.base_config.LoggingConfig
17
+ local_writer: !!python/object:nerfstudio.configs.base_config.LocalWriterConfig
18
+ _target: !!python/name:nerfstudio.utils.writer.LocalWriter ''
19
+ enable: true
20
+ max_log_size: 10
21
+ stats_to_track: !!python/tuple
22
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
23
+ - Train Iter (time)
24
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
25
+ - Train Rays / Sec
26
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
27
+ - Test PSNR
28
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
29
+ - Vis Rays / Sec
30
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
31
+ - Test Rays / Sec
32
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
33
+ - ETA (time)
34
+ max_buffer_size: 20
35
+ profiler: basic
36
+ relative_log_dir: !!python/object/apply:pathlib.PosixPath []
37
+ steps_per_log: 10
38
+ machine: !!python/object:nerfstudio.configs.base_config.MachineConfig
39
+ device_type: cuda
40
+ dist_url: auto
41
+ machine_rank: 0
42
+ num_devices: 1
43
+ num_machines: 1
44
+ seed: 42
45
+ max_num_iterations: 500001
46
+ method_name: NeRAF
47
+ mixed_precision: true
48
+ optimizers:
49
+ audio_fields:
50
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
51
+ _target: &id001 !!python/name:torch.optim.adam.Adam ''
52
+ eps: 1.0e-15
53
+ lr: 0.0001
54
+ max_norm: null
55
+ weight_decay: 0
56
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
57
+ _target: &id002 !!python/name:nerfstudio.engine.schedulers.ExponentialDecayScheduler ''
58
+ lr_final: 1.0e-08
59
+ lr_pre_warmup: 1.0e-08
60
+ max_steps: 1002000
61
+ ramp: cosine
62
+ warmup_steps: 2000
63
+ camera_opt:
64
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
65
+ _target: *id001
66
+ eps: 1.0e-15
67
+ lr: 0.001
68
+ max_norm: null
69
+ weight_decay: 0
70
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
71
+ _target: *id002
72
+ lr_final: 0.0001
73
+ lr_pre_warmup: 1.0e-08
74
+ max_steps: 5000
75
+ ramp: cosine
76
+ warmup_steps: 0
77
+ fields:
78
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
79
+ _target: *id001
80
+ eps: 1.0e-15
81
+ lr: 0.01
82
+ max_norm: null
83
+ weight_decay: 0
84
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
85
+ _target: *id002
86
+ lr_final: 0.0001
87
+ lr_pre_warmup: 1.0e-08
88
+ max_steps: 200000
89
+ ramp: cosine
90
+ warmup_steps: 0
91
+ proposal_networks:
92
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
93
+ _target: *id001
94
+ eps: 1.0e-15
95
+ lr: 0.01
96
+ max_norm: null
97
+ weight_decay: 0
98
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
99
+ _target: *id002
100
+ lr_final: 0.0001
101
+ lr_pre_warmup: 1.0e-08
102
+ max_steps: 200000
103
+ ramp: cosine
104
+ warmup_steps: 0
105
+ output_dir: !!python/object/apply:pathlib.PosixPath
106
+ - ../
107
+ - outputs
108
+ pipeline: !!python/object:NeRAF.NeRAF_pipeline.NeRAFPipelineConfig
109
+ _target: !!python/name:NeRAF.NeRAF_pipeline.NeRAFPipeline ''
110
+ audio_datamanager: !!python/object:NeRAF.NeRAF_datamanager.SoundSpacesDataManagerConfig
111
+ _target: !!python/name:NeRAF.NeRAF_datamanager.SoundSpacesDataManager ''
112
+ collate_fn: &id003 !!python/name:nerfstudio.data.utils.nerfstudio_collate.nerfstudio_collate ''
113
+ data: null
114
+ dataparser: !!python/object:NeRAF.NeRAF_dataparser.SoundSpacesDataParserConfig
115
+ _target: !!python/name:NeRAF.NeRAF_dataparser.SoundSpacesDataParser ''
116
+ data: !!python/object/apply:pathlib.PosixPath []
117
+ eval_num_rays_per_batch: 2048
118
+ fs: 22050
119
+ hop_len: 128
120
+ images_on_gpu: false
121
+ masks_on_gpu: false
122
+ max_len: 101
123
+ train_num_rays_per_batch: 2048
124
+ audio_model: !!python/object:NeRAF.NeRAF_model.NeRAFAudioModelConfig
125
+ N_features: 2048
126
+ N_freq_stft: 257
127
+ W_field: 512
128
+ _target: !!python/name:NeRAF.NeRAF_model.NeRAFAudioModel ''
129
+ collider_params:
130
+ far_plane: 6.0
131
+ near_plane: 2.0
132
+ criterion: SC+SLMSE
133
+ dataset: SoundSpaces
134
+ enable_collider: true
135
+ eval_num_rays_per_chunk: 4096
136
+ fs: 22050
137
+ grid_step: 0.0078125
138
+ hop_len: 128
139
+ loss_coefficients:
140
+ rgb_loss_coarse: 1.0
141
+ rgb_loss_fine: 1.0
142
+ loss_factor: 0.001
143
+ max_len: 101
144
+ prompt: null
145
+ use_grid: true
146
+ use_multiple_viewing_directions: true
147
+ win_len: 512
148
+ datamanager: !!python/object:nerfstudio.data.datamanagers.parallel_datamanager.ParallelDataManagerConfig
149
+ _target: !!python/name:nerfstudio.data.datamanagers.parallel_datamanager.ParallelDataManager ''
150
+ camera_optimizer: null
151
+ camera_res_scale_factor: 1.0
152
+ collate_fn: *id003
153
+ data: *id004
154
+ dataparser: !!python/object:nerfstudio.data.dataparsers.nerfstudio_dataparser.NerfstudioDataParserConfig
155
+ _target: !!python/name:nerfstudio.data.dataparsers.nerfstudio_dataparser.Nerfstudio ''
156
+ auto_scale_poses: true
157
+ center_method: poses
158
+ data: !!python/object/apply:pathlib.PosixPath []
159
+ depth_unit_scale_factor: 0.001
160
+ downscale_factor: null
161
+ eval_interval: 8
162
+ eval_mode: filename
163
+ load_3D_points: false
164
+ mask_color: null
165
+ orientation_method: up
166
+ scale_factor: 1.0
167
+ scene_scale: 1.0
168
+ train_split_fraction: 0.9
169
+ eval_image_indices: !!python/tuple
170
+ - 0
171
+ eval_num_images_to_sample_from: -1
172
+ eval_num_rays_per_batch: 4096
173
+ eval_num_times_to_repeat_images: -1
174
+ images_on_gpu: true
175
+ masks_on_gpu: true
176
+ max_thread_workers: null
177
+ num_processes: 1
178
+ patch_size: 1
179
+ pixel_sampler: !!python/object:nerfstudio.data.pixel_samplers.PixelSamplerConfig
180
+ _target: !!python/name:nerfstudio.data.pixel_samplers.PixelSampler ''
181
+ fisheye_crop_radius: null
182
+ ignore_mask: false
183
+ is_equirectangular: false
184
+ keep_full_image: false
185
+ max_num_iterations: 100
186
+ num_rays_per_batch: 4096
187
+ rejection_sample_mask: true
188
+ queue_size: 2
189
+ train_num_images_to_sample_from: -1
190
+ train_num_rays_per_batch: 4096
191
+ train_num_times_to_repeat_images: -1
192
+ model: !!python/object:nerfstudio.models.base_model.ModelConfig
193
+ _target: !!python/name:nerfstudio.models.base_model.Model ''
194
+ collider_params:
195
+ far_plane: 6.0
196
+ near_plane: 2.0
197
+ enable_collider: true
198
+ eval_num_rays_per_chunk: 4096
199
+ loss_coefficients:
200
+ rgb_loss_coarse: 1.0
201
+ rgb_loss_fine: 1.0
202
+ prompt: null
203
+ save_eval_audio_path: null
204
+ start_step_audio: 2000
205
+ vision_model: !!python/object:NeRAF.NeRAF_model.NeRAFVisionModelConfig
206
+ _target: !!python/name:NeRAF.NeRAF_model.NeRAFVisionModel ''
207
+ appearance_embed_dim: 32
208
+ average_init_density: 0.01
209
+ background_color: last_sample
210
+ base_res: 16
211
+ camera_optimizer: !!python/object:nerfstudio.cameras.camera_optimizers.CameraOptimizerConfig
212
+ _target: !!python/name:nerfstudio.cameras.camera_optimizers.CameraOptimizer ''
213
+ mode: SO3xR3
214
+ optimizer: null
215
+ rot_l2_penalty: 0.001
216
+ scheduler: null
217
+ trans_l2_penalty: 0.01
218
+ collider_params:
219
+ far_plane: 6.0
220
+ near_plane: 2.0
221
+ disable_scene_contraction: false
222
+ distortion_loss_mult: 0.002
223
+ enable_collider: true
224
+ eval_num_rays_per_chunk: 32768
225
+ far_plane: 1000.0
226
+ features_per_level: 2
227
+ hidden_dim: 64
228
+ hidden_dim_color: 64
229
+ hidden_dim_transient: 64
230
+ implementation: tcnn
231
+ interlevel_loss_mult: 1.0
232
+ log2_hashmap_size: 19
233
+ loss_coefficients:
234
+ rgb_loss_coarse: 1.0
235
+ rgb_loss_fine: 1.0
236
+ max_res: 2048
237
+ near_plane: 0.05
238
+ num_levels: 16
239
+ num_nerf_samples_per_ray: 48
240
+ num_proposal_iterations: 2
241
+ num_proposal_samples_per_ray: !!python/tuple
242
+ - 256
243
+ - 96
244
+ orientation_loss_mult: 0.0001
245
+ pred_normal_loss_mult: 0.001
246
+ predict_normals: false
247
+ prompt: null
248
+ proposal_initial_sampler: piecewise
249
+ proposal_net_args_list:
250
+ - hidden_dim: 16
251
+ log2_hashmap_size: 17
252
+ max_res: 128
253
+ num_levels: 5
254
+ use_linear: false
255
+ - hidden_dim: 16
256
+ log2_hashmap_size: 17
257
+ max_res: 256
258
+ num_levels: 5
259
+ use_linear: false
260
+ proposal_update_every: 5
261
+ proposal_warmup: 5000
262
+ proposal_weights_anneal_max_num_iters: 1000
263
+ proposal_weights_anneal_slope: 10.0
264
+ use_appearance_embedding: true
265
+ use_average_appearance_embedding: true
266
+ use_gradient_scaling: false
267
+ use_proposal_weight_anneal: true
268
+ use_same_proposal_network: false
269
+ use_single_jitter: true
270
+ project_name: nerfstudio-project
271
+ prompt: null
272
+ relative_model_dir: !!python/object/apply:pathlib.PosixPath
273
+ - nerfstudio_models
274
+ save_only_latest_checkpoint: false
275
+ steps_per_eval_all_images: 10000
276
+ steps_per_eval_batch: 10000
277
+ steps_per_eval_image: 10000
278
+ steps_per_save: 10000
279
+ timestamp: 2024-10-18_093105
280
+ use_grad_scaler: false
281
+ viewer: !!python/object:nerfstudio.configs.base_config.ViewerConfig
282
+ camera_frustum_scale: 0.1
283
+ default_composite_depth: true
284
+ image_format: jpeg
285
+ jpeg_quality: 75
286
+ make_share_url: false
287
+ max_num_display_images: 512
288
+ num_rays_per_chunk: 32768
289
+ quit_on_train_completion: false
290
+ relative_log_filename: viewer_log_filename.txt
291
+ websocket_host: 0.0.0.0
292
+ websocket_port: null
293
+ websocket_port_default: 7007
294
+ vis: tensorboard
SoundSpaces/apartment_1_NeRAF/NeRAF/2024-10-18_093105/dataparser_transforms.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "transform": [
3
+ [
4
+ 1.0,
5
+ 0.0,
6
+ 0.0,
7
+ 3.3542232513427734
8
+ ],
9
+ [
10
+ 0.0,
11
+ 1.0,
12
+ 0.0,
13
+ 3.233105182647705
14
+ ],
15
+ [
16
+ 0.0,
17
+ 0.0,
18
+ 1.0,
19
+ 1.7497400045394897
20
+ ]
21
+ ],
22
+ "scale": 0.1816968860606569
23
+ }
SoundSpaces/apartment_1_NeRAF/NeRAF/2024-10-18_093105/nerfstudio_models/step-000480000.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a79809688f6e10992404e5174090d0165cc0107c369a05dd3693f7e1de9a0dd3
3
+ size 1195042065
SoundSpaces/apartment_2_NeRAF/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/apartment_2_NeRAF/NeRAF/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/apartment_2_NeRAF/NeRAF/2024-10-13_131052/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/apartment_2_NeRAF/NeRAF/2024-10-13_131052/config.yml ADDED
@@ -0,0 +1,294 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ !!python/object:nerfstudio.engine.trainer.TrainerConfig
2
+ _target: !!python/name:nerfstudio.engine.trainer.Trainer ''
3
+ data: &id004 !!python/object/apply:pathlib.PosixPath
4
+ - ../
5
+ - data
6
+ - SoundSpaces
7
+ - apartment_2
8
+ experiment_name: apartment_2_NeRAF
9
+ gradient_accumulation_steps: {}
10
+ load_checkpoint: null
11
+ load_config: null
12
+ load_dir: null
13
+ load_scheduler: true
14
+ load_step: null
15
+ log_gradients: false
16
+ logging: !!python/object:nerfstudio.configs.base_config.LoggingConfig
17
+ local_writer: !!python/object:nerfstudio.configs.base_config.LocalWriterConfig
18
+ _target: !!python/name:nerfstudio.utils.writer.LocalWriter ''
19
+ enable: true
20
+ max_log_size: 10
21
+ stats_to_track: !!python/tuple
22
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
23
+ - Train Iter (time)
24
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
25
+ - Train Rays / Sec
26
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
27
+ - Test PSNR
28
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
29
+ - Vis Rays / Sec
30
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
31
+ - Test Rays / Sec
32
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
33
+ - ETA (time)
34
+ max_buffer_size: 20
35
+ profiler: basic
36
+ relative_log_dir: !!python/object/apply:pathlib.PosixPath []
37
+ steps_per_log: 10
38
+ machine: !!python/object:nerfstudio.configs.base_config.MachineConfig
39
+ device_type: cuda
40
+ dist_url: auto
41
+ machine_rank: 0
42
+ num_devices: 1
43
+ num_machines: 1
44
+ seed: 42
45
+ max_num_iterations: 500001
46
+ method_name: NeRAF
47
+ mixed_precision: true
48
+ optimizers:
49
+ audio_fields:
50
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
51
+ _target: &id001 !!python/name:torch.optim.adam.Adam ''
52
+ eps: 1.0e-15
53
+ lr: 0.0001
54
+ max_norm: null
55
+ weight_decay: 0
56
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
57
+ _target: &id002 !!python/name:nerfstudio.engine.schedulers.ExponentialDecayScheduler ''
58
+ lr_final: 1.0e-08
59
+ lr_pre_warmup: 1.0e-08
60
+ max_steps: 1002000
61
+ ramp: cosine
62
+ warmup_steps: 2000
63
+ camera_opt:
64
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
65
+ _target: *id001
66
+ eps: 1.0e-15
67
+ lr: 0.001
68
+ max_norm: null
69
+ weight_decay: 0
70
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
71
+ _target: *id002
72
+ lr_final: 0.0001
73
+ lr_pre_warmup: 1.0e-08
74
+ max_steps: 5000
75
+ ramp: cosine
76
+ warmup_steps: 0
77
+ fields:
78
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
79
+ _target: *id001
80
+ eps: 1.0e-15
81
+ lr: 0.01
82
+ max_norm: null
83
+ weight_decay: 0
84
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
85
+ _target: *id002
86
+ lr_final: 0.0001
87
+ lr_pre_warmup: 1.0e-08
88
+ max_steps: 200000
89
+ ramp: cosine
90
+ warmup_steps: 0
91
+ proposal_networks:
92
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
93
+ _target: *id001
94
+ eps: 1.0e-15
95
+ lr: 0.01
96
+ max_norm: null
97
+ weight_decay: 0
98
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
99
+ _target: *id002
100
+ lr_final: 0.0001
101
+ lr_pre_warmup: 1.0e-08
102
+ max_steps: 200000
103
+ ramp: cosine
104
+ warmup_steps: 0
105
+ output_dir: !!python/object/apply:pathlib.PosixPath
106
+ - ../
107
+ - outputs
108
+ pipeline: !!python/object:NeRAF.NeRAF_pipeline.NeRAFPipelineConfig
109
+ _target: !!python/name:NeRAF.NeRAF_pipeline.NeRAFPipeline ''
110
+ audio_datamanager: !!python/object:NeRAF.NeRAF_datamanager.SoundSpacesDataManagerConfig
111
+ _target: !!python/name:NeRAF.NeRAF_datamanager.SoundSpacesDataManager ''
112
+ collate_fn: &id003 !!python/name:nerfstudio.data.utils.nerfstudio_collate.nerfstudio_collate ''
113
+ data: null
114
+ dataparser: !!python/object:NeRAF.NeRAF_dataparser.SoundSpacesDataParserConfig
115
+ _target: !!python/name:NeRAF.NeRAF_dataparser.SoundSpacesDataParser ''
116
+ data: !!python/object/apply:pathlib.PosixPath []
117
+ eval_num_rays_per_batch: 2048
118
+ fs: 22050
119
+ hop_len: 128
120
+ images_on_gpu: false
121
+ masks_on_gpu: false
122
+ max_len: 86
123
+ train_num_rays_per_batch: 2048
124
+ audio_model: !!python/object:NeRAF.NeRAF_model.NeRAFAudioModelConfig
125
+ N_features: 1024
126
+ N_freq_stft: 257
127
+ W_field: 512
128
+ _target: !!python/name:NeRAF.NeRAF_model.NeRAFAudioModel ''
129
+ collider_params:
130
+ far_plane: 6.0
131
+ near_plane: 2.0
132
+ criterion: SC+SLMSE
133
+ dataset: SoundSpaces
134
+ enable_collider: true
135
+ eval_num_rays_per_chunk: 4096
136
+ fs: 22050
137
+ grid_step: 0.0078125
138
+ hop_len: 128
139
+ loss_coefficients:
140
+ rgb_loss_coarse: 1.0
141
+ rgb_loss_fine: 1.0
142
+ loss_factor: 0.001
143
+ max_len: 86
144
+ prompt: null
145
+ use_grid: true
146
+ use_multiple_viewing_directions: true
147
+ win_len: 512
148
+ datamanager: !!python/object:nerfstudio.data.datamanagers.parallel_datamanager.ParallelDataManagerConfig
149
+ _target: !!python/name:nerfstudio.data.datamanagers.parallel_datamanager.ParallelDataManager ''
150
+ camera_optimizer: null
151
+ camera_res_scale_factor: 1.0
152
+ collate_fn: *id003
153
+ data: *id004
154
+ dataparser: !!python/object:nerfstudio.data.dataparsers.nerfstudio_dataparser.NerfstudioDataParserConfig
155
+ _target: !!python/name:nerfstudio.data.dataparsers.nerfstudio_dataparser.Nerfstudio ''
156
+ auto_scale_poses: true
157
+ center_method: poses
158
+ data: !!python/object/apply:pathlib.PosixPath []
159
+ depth_unit_scale_factor: 0.001
160
+ downscale_factor: null
161
+ eval_interval: 8
162
+ eval_mode: filename
163
+ load_3D_points: false
164
+ mask_color: null
165
+ orientation_method: up
166
+ scale_factor: 1.0
167
+ scene_scale: 1.0
168
+ train_split_fraction: 0.9
169
+ eval_image_indices: !!python/tuple
170
+ - 0
171
+ eval_num_images_to_sample_from: -1
172
+ eval_num_rays_per_batch: 4096
173
+ eval_num_times_to_repeat_images: -1
174
+ images_on_gpu: true
175
+ masks_on_gpu: true
176
+ max_thread_workers: null
177
+ num_processes: 1
178
+ patch_size: 1
179
+ pixel_sampler: !!python/object:nerfstudio.data.pixel_samplers.PixelSamplerConfig
180
+ _target: !!python/name:nerfstudio.data.pixel_samplers.PixelSampler ''
181
+ fisheye_crop_radius: null
182
+ ignore_mask: false
183
+ is_equirectangular: false
184
+ keep_full_image: false
185
+ max_num_iterations: 100
186
+ num_rays_per_batch: 4096
187
+ rejection_sample_mask: true
188
+ queue_size: 2
189
+ train_num_images_to_sample_from: -1
190
+ train_num_rays_per_batch: 4096
191
+ train_num_times_to_repeat_images: -1
192
+ model: !!python/object:nerfstudio.models.base_model.ModelConfig
193
+ _target: !!python/name:nerfstudio.models.base_model.Model ''
194
+ collider_params:
195
+ far_plane: 6.0
196
+ near_plane: 2.0
197
+ enable_collider: true
198
+ eval_num_rays_per_chunk: 4096
199
+ loss_coefficients:
200
+ rgb_loss_coarse: 1.0
201
+ rgb_loss_fine: 1.0
202
+ prompt: null
203
+ save_eval_audio_path: null
204
+ start_step_audio: 2000
205
+ vision_model: !!python/object:NeRAF.NeRAF_model.NeRAFVisionModelConfig
206
+ _target: !!python/name:NeRAF.NeRAF_model.NeRAFVisionModel ''
207
+ appearance_embed_dim: 32
208
+ average_init_density: 0.01
209
+ background_color: last_sample
210
+ base_res: 16
211
+ camera_optimizer: !!python/object:nerfstudio.cameras.camera_optimizers.CameraOptimizerConfig
212
+ _target: !!python/name:nerfstudio.cameras.camera_optimizers.CameraOptimizer ''
213
+ mode: SO3xR3
214
+ optimizer: null
215
+ rot_l2_penalty: 0.001
216
+ scheduler: null
217
+ trans_l2_penalty: 0.01
218
+ collider_params:
219
+ far_plane: 6.0
220
+ near_plane: 2.0
221
+ disable_scene_contraction: false
222
+ distortion_loss_mult: 0.002
223
+ enable_collider: true
224
+ eval_num_rays_per_chunk: 32768
225
+ far_plane: 1000.0
226
+ features_per_level: 2
227
+ hidden_dim: 64
228
+ hidden_dim_color: 64
229
+ hidden_dim_transient: 64
230
+ implementation: tcnn
231
+ interlevel_loss_mult: 1.0
232
+ log2_hashmap_size: 19
233
+ loss_coefficients:
234
+ rgb_loss_coarse: 1.0
235
+ rgb_loss_fine: 1.0
236
+ max_res: 2048
237
+ near_plane: 0.05
238
+ num_levels: 16
239
+ num_nerf_samples_per_ray: 48
240
+ num_proposal_iterations: 2
241
+ num_proposal_samples_per_ray: !!python/tuple
242
+ - 256
243
+ - 96
244
+ orientation_loss_mult: 0.0001
245
+ pred_normal_loss_mult: 0.001
246
+ predict_normals: false
247
+ prompt: null
248
+ proposal_initial_sampler: piecewise
249
+ proposal_net_args_list:
250
+ - hidden_dim: 16
251
+ log2_hashmap_size: 17
252
+ max_res: 128
253
+ num_levels: 5
254
+ use_linear: false
255
+ - hidden_dim: 16
256
+ log2_hashmap_size: 17
257
+ max_res: 256
258
+ num_levels: 5
259
+ use_linear: false
260
+ proposal_update_every: 5
261
+ proposal_warmup: 5000
262
+ proposal_weights_anneal_max_num_iters: 1000
263
+ proposal_weights_anneal_slope: 10.0
264
+ use_appearance_embedding: true
265
+ use_average_appearance_embedding: true
266
+ use_gradient_scaling: false
267
+ use_proposal_weight_anneal: true
268
+ use_same_proposal_network: false
269
+ use_single_jitter: true
270
+ project_name: nerfstudio-project
271
+ prompt: null
272
+ relative_model_dir: !!python/object/apply:pathlib.PosixPath
273
+ - nerfstudio_models
274
+ save_only_latest_checkpoint: false
275
+ steps_per_eval_all_images: 10000
276
+ steps_per_eval_batch: 10000
277
+ steps_per_eval_image: 10000
278
+ steps_per_save: 10000
279
+ timestamp: 2024-10-13_131052
280
+ use_grad_scaler: false
281
+ viewer: !!python/object:nerfstudio.configs.base_config.ViewerConfig
282
+ camera_frustum_scale: 0.1
283
+ default_composite_depth: true
284
+ image_format: jpeg
285
+ jpeg_quality: 75
286
+ make_share_url: false
287
+ max_num_display_images: 512
288
+ num_rays_per_chunk: 32768
289
+ quit_on_train_completion: false
290
+ relative_log_filename: viewer_log_filename.txt
291
+ websocket_host: 0.0.0.0
292
+ websocket_port: null
293
+ websocket_port_default: 7007
294
+ vis: tensorboard
SoundSpaces/apartment_2_NeRAF/NeRAF/2024-10-13_131052/dataparser_transforms.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "transform": [
3
+ [
4
+ 1.0,
5
+ 0.0,
6
+ 0.0,
7
+ 2.539200782775879
8
+ ],
9
+ [
10
+ 0.0,
11
+ 1.0,
12
+ 0.0,
13
+ 3.0175981521606445
14
+ ],
15
+ [
16
+ 0.0,
17
+ 0.0,
18
+ 1.0,
19
+ 1.6110721826553345
20
+ ]
21
+ ],
22
+ "scale": 0.1954609374883496
23
+ }
SoundSpaces/apartment_2_NeRAF/NeRAF/2024-10-13_131052/nerfstudio_models/step-000150000.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af1e65265dfba186c644b4054f6faf664d79badd6e4405356ed5f555362a0c99
3
+ size 782825379
SoundSpaces/frl_apartment_2_NeRAF/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/frl_apartment_2_NeRAF/NeRAF/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/frl_apartment_2_NeRAF/NeRAF/2024-10-18_133400/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/frl_apartment_2_NeRAF/NeRAF/2024-10-18_133400/config.yml ADDED
@@ -0,0 +1,294 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ !!python/object:nerfstudio.engine.trainer.TrainerConfig
2
+ _target: !!python/name:nerfstudio.engine.trainer.Trainer ''
3
+ data: &id004 !!python/object/apply:pathlib.PosixPath
4
+ - ../
5
+ - data
6
+ - SoundSpaces
7
+ - frl_apartment_2
8
+ experiment_name: frl_apartment_2_NeRAF
9
+ gradient_accumulation_steps: {}
10
+ load_checkpoint: null
11
+ load_config: null
12
+ load_dir: null
13
+ load_scheduler: true
14
+ load_step: null
15
+ log_gradients: false
16
+ logging: !!python/object:nerfstudio.configs.base_config.LoggingConfig
17
+ local_writer: !!python/object:nerfstudio.configs.base_config.LocalWriterConfig
18
+ _target: !!python/name:nerfstudio.utils.writer.LocalWriter ''
19
+ enable: true
20
+ max_log_size: 10
21
+ stats_to_track: !!python/tuple
22
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
23
+ - Train Iter (time)
24
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
25
+ - Train Rays / Sec
26
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
27
+ - Test PSNR
28
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
29
+ - Vis Rays / Sec
30
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
31
+ - Test Rays / Sec
32
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
33
+ - ETA (time)
34
+ max_buffer_size: 20
35
+ profiler: basic
36
+ relative_log_dir: !!python/object/apply:pathlib.PosixPath []
37
+ steps_per_log: 10
38
+ machine: !!python/object:nerfstudio.configs.base_config.MachineConfig
39
+ device_type: cuda
40
+ dist_url: auto
41
+ machine_rank: 0
42
+ num_devices: 1
43
+ num_machines: 1
44
+ seed: 42
45
+ max_num_iterations: 500001
46
+ method_name: NeRAF
47
+ mixed_precision: true
48
+ optimizers:
49
+ audio_fields:
50
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
51
+ _target: &id001 !!python/name:torch.optim.adam.Adam ''
52
+ eps: 1.0e-15
53
+ lr: 0.0001
54
+ max_norm: null
55
+ weight_decay: 0
56
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
57
+ _target: &id002 !!python/name:nerfstudio.engine.schedulers.ExponentialDecayScheduler ''
58
+ lr_final: 1.0e-08
59
+ lr_pre_warmup: 1.0e-08
60
+ max_steps: 1002000
61
+ ramp: cosine
62
+ warmup_steps: 2000
63
+ camera_opt:
64
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
65
+ _target: *id001
66
+ eps: 1.0e-15
67
+ lr: 0.001
68
+ max_norm: null
69
+ weight_decay: 0
70
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
71
+ _target: *id002
72
+ lr_final: 0.0001
73
+ lr_pre_warmup: 1.0e-08
74
+ max_steps: 5000
75
+ ramp: cosine
76
+ warmup_steps: 0
77
+ fields:
78
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
79
+ _target: *id001
80
+ eps: 1.0e-15
81
+ lr: 0.01
82
+ max_norm: null
83
+ weight_decay: 0
84
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
85
+ _target: *id002
86
+ lr_final: 0.0001
87
+ lr_pre_warmup: 1.0e-08
88
+ max_steps: 200000
89
+ ramp: cosine
90
+ warmup_steps: 0
91
+ proposal_networks:
92
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
93
+ _target: *id001
94
+ eps: 1.0e-15
95
+ lr: 0.01
96
+ max_norm: null
97
+ weight_decay: 0
98
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
99
+ _target: *id002
100
+ lr_final: 0.0001
101
+ lr_pre_warmup: 1.0e-08
102
+ max_steps: 200000
103
+ ramp: cosine
104
+ warmup_steps: 0
105
+ output_dir: !!python/object/apply:pathlib.PosixPath
106
+ - ../
107
+ - outputs
108
+ pipeline: !!python/object:NeRAF.NeRAF_pipeline.NeRAFPipelineConfig
109
+ _target: !!python/name:NeRAF.NeRAF_pipeline.NeRAFPipeline ''
110
+ audio_datamanager: !!python/object:NeRAF.NeRAF_datamanager.SoundSpacesDataManagerConfig
111
+ _target: !!python/name:NeRAF.NeRAF_datamanager.SoundSpacesDataManager ''
112
+ collate_fn: &id003 !!python/name:nerfstudio.data.utils.nerfstudio_collate.nerfstudio_collate ''
113
+ data: null
114
+ dataparser: !!python/object:NeRAF.NeRAF_dataparser.SoundSpacesDataParserConfig
115
+ _target: !!python/name:NeRAF.NeRAF_dataparser.SoundSpacesDataParser ''
116
+ data: !!python/object/apply:pathlib.PosixPath []
117
+ eval_num_rays_per_batch: 2048
118
+ fs: 22050
119
+ hop_len: 128
120
+ images_on_gpu: false
121
+ masks_on_gpu: false
122
+ max_len: 107
123
+ train_num_rays_per_batch: 2048
124
+ audio_model: !!python/object:NeRAF.NeRAF_model.NeRAFAudioModelConfig
125
+ N_features: 2048
126
+ N_freq_stft: 257
127
+ W_field: 512
128
+ _target: !!python/name:NeRAF.NeRAF_model.NeRAFAudioModel ''
129
+ collider_params:
130
+ far_plane: 6.0
131
+ near_plane: 2.0
132
+ criterion: SC+SLMSE
133
+ dataset: SoundSpaces
134
+ enable_collider: true
135
+ eval_num_rays_per_chunk: 4096
136
+ fs: 22050
137
+ grid_step: 0.0078125
138
+ hop_len: 128
139
+ loss_coefficients:
140
+ rgb_loss_coarse: 1.0
141
+ rgb_loss_fine: 1.0
142
+ loss_factor: 0.001
143
+ max_len: 107
144
+ prompt: null
145
+ use_grid: true
146
+ use_multiple_viewing_directions: true
147
+ win_len: 512
148
+ datamanager: !!python/object:nerfstudio.data.datamanagers.parallel_datamanager.ParallelDataManagerConfig
149
+ _target: !!python/name:nerfstudio.data.datamanagers.parallel_datamanager.ParallelDataManager ''
150
+ camera_optimizer: null
151
+ camera_res_scale_factor: 1.0
152
+ collate_fn: *id003
153
+ data: *id004
154
+ dataparser: !!python/object:nerfstudio.data.dataparsers.nerfstudio_dataparser.NerfstudioDataParserConfig
155
+ _target: !!python/name:nerfstudio.data.dataparsers.nerfstudio_dataparser.Nerfstudio ''
156
+ auto_scale_poses: true
157
+ center_method: poses
158
+ data: !!python/object/apply:pathlib.PosixPath []
159
+ depth_unit_scale_factor: 0.001
160
+ downscale_factor: null
161
+ eval_interval: 8
162
+ eval_mode: filename
163
+ load_3D_points: false
164
+ mask_color: null
165
+ orientation_method: up
166
+ scale_factor: 1.0
167
+ scene_scale: 1.0
168
+ train_split_fraction: 0.9
169
+ eval_image_indices: !!python/tuple
170
+ - 0
171
+ eval_num_images_to_sample_from: -1
172
+ eval_num_rays_per_batch: 4096
173
+ eval_num_times_to_repeat_images: -1
174
+ images_on_gpu: true
175
+ masks_on_gpu: true
176
+ max_thread_workers: null
177
+ num_processes: 1
178
+ patch_size: 1
179
+ pixel_sampler: !!python/object:nerfstudio.data.pixel_samplers.PixelSamplerConfig
180
+ _target: !!python/name:nerfstudio.data.pixel_samplers.PixelSampler ''
181
+ fisheye_crop_radius: null
182
+ ignore_mask: false
183
+ is_equirectangular: false
184
+ keep_full_image: false
185
+ max_num_iterations: 100
186
+ num_rays_per_batch: 4096
187
+ rejection_sample_mask: true
188
+ queue_size: 2
189
+ train_num_images_to_sample_from: -1
190
+ train_num_rays_per_batch: 4096
191
+ train_num_times_to_repeat_images: -1
192
+ model: !!python/object:nerfstudio.models.base_model.ModelConfig
193
+ _target: !!python/name:nerfstudio.models.base_model.Model ''
194
+ collider_params:
195
+ far_plane: 6.0
196
+ near_plane: 2.0
197
+ enable_collider: true
198
+ eval_num_rays_per_chunk: 4096
199
+ loss_coefficients:
200
+ rgb_loss_coarse: 1.0
201
+ rgb_loss_fine: 1.0
202
+ prompt: null
203
+ save_eval_audio_path: null
204
+ start_step_audio: 2000
205
+ vision_model: !!python/object:NeRAF.NeRAF_model.NeRAFVisionModelConfig
206
+ _target: !!python/name:NeRAF.NeRAF_model.NeRAFVisionModel ''
207
+ appearance_embed_dim: 32
208
+ average_init_density: 0.01
209
+ background_color: last_sample
210
+ base_res: 16
211
+ camera_optimizer: !!python/object:nerfstudio.cameras.camera_optimizers.CameraOptimizerConfig
212
+ _target: !!python/name:nerfstudio.cameras.camera_optimizers.CameraOptimizer ''
213
+ mode: SO3xR3
214
+ optimizer: null
215
+ rot_l2_penalty: 0.001
216
+ scheduler: null
217
+ trans_l2_penalty: 0.01
218
+ collider_params:
219
+ far_plane: 6.0
220
+ near_plane: 2.0
221
+ disable_scene_contraction: false
222
+ distortion_loss_mult: 0.002
223
+ enable_collider: true
224
+ eval_num_rays_per_chunk: 32768
225
+ far_plane: 1000.0
226
+ features_per_level: 2
227
+ hidden_dim: 64
228
+ hidden_dim_color: 64
229
+ hidden_dim_transient: 64
230
+ implementation: tcnn
231
+ interlevel_loss_mult: 1.0
232
+ log2_hashmap_size: 19
233
+ loss_coefficients:
234
+ rgb_loss_coarse: 1.0
235
+ rgb_loss_fine: 1.0
236
+ max_res: 2048
237
+ near_plane: 0.05
238
+ num_levels: 16
239
+ num_nerf_samples_per_ray: 48
240
+ num_proposal_iterations: 2
241
+ num_proposal_samples_per_ray: !!python/tuple
242
+ - 256
243
+ - 96
244
+ orientation_loss_mult: 0.0001
245
+ pred_normal_loss_mult: 0.001
246
+ predict_normals: false
247
+ prompt: null
248
+ proposal_initial_sampler: piecewise
249
+ proposal_net_args_list:
250
+ - hidden_dim: 16
251
+ log2_hashmap_size: 17
252
+ max_res: 128
253
+ num_levels: 5
254
+ use_linear: false
255
+ - hidden_dim: 16
256
+ log2_hashmap_size: 17
257
+ max_res: 256
258
+ num_levels: 5
259
+ use_linear: false
260
+ proposal_update_every: 5
261
+ proposal_warmup: 5000
262
+ proposal_weights_anneal_max_num_iters: 1000
263
+ proposal_weights_anneal_slope: 10.0
264
+ use_appearance_embedding: true
265
+ use_average_appearance_embedding: true
266
+ use_gradient_scaling: false
267
+ use_proposal_weight_anneal: true
268
+ use_same_proposal_network: false
269
+ use_single_jitter: true
270
+ project_name: nerfstudio-project
271
+ prompt: null
272
+ relative_model_dir: !!python/object/apply:pathlib.PosixPath
273
+ - nerfstudio_models
274
+ save_only_latest_checkpoint: false
275
+ steps_per_eval_all_images: 10000
276
+ steps_per_eval_batch: 10000
277
+ steps_per_eval_image: 10000
278
+ steps_per_save: 10000
279
+ timestamp: 2024-10-18_133400
280
+ use_grad_scaler: false
281
+ viewer: !!python/object:nerfstudio.configs.base_config.ViewerConfig
282
+ camera_frustum_scale: 0.1
283
+ default_composite_depth: true
284
+ image_format: jpeg
285
+ jpeg_quality: 75
286
+ make_share_url: false
287
+ max_num_display_images: 512
288
+ num_rays_per_chunk: 32768
289
+ quit_on_train_completion: false
290
+ relative_log_filename: viewer_log_filename.txt
291
+ websocket_host: 0.0.0.0
292
+ websocket_port: null
293
+ websocket_port_default: 7007
294
+ vis: tensorboard
SoundSpaces/frl_apartment_2_NeRAF/NeRAF/2024-10-18_133400/dataparser_transforms.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "transform": [
3
+ [
4
+ 1.0,
5
+ 0.0,
6
+ 0.0,
7
+ 2.636273145675659
8
+ ],
9
+ [
10
+ 0.0,
11
+ 1.0,
12
+ 0.0,
13
+ 1.7466418743133545
14
+ ],
15
+ [
16
+ 0.0,
17
+ 0.0,
18
+ 1.0,
19
+ 1.4013906717300415
20
+ ]
21
+ ],
22
+ "scale": 0.18044055968484302
23
+ }
SoundSpaces/frl_apartment_2_NeRAF/NeRAF/2024-10-18_133400/nerfstudio_models/step-000450000.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6724db0d8f9e72b48c43f2fa575840eba9c9b44eb6b357df3745dedf3eea4b96
3
+ size 1194988689
SoundSpaces/frl_apartment_4_NeRAF/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/frl_apartment_4_NeRAF/NeRAF/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/frl_apartment_4_NeRAF/NeRAF/2024-10-20_105001/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/frl_apartment_4_NeRAF/NeRAF/2024-10-20_105001/config.yml ADDED
@@ -0,0 +1,294 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ !!python/object:nerfstudio.engine.trainer.TrainerConfig
2
+ _target: !!python/name:nerfstudio.engine.trainer.Trainer ''
3
+ data: &id004 !!python/object/apply:pathlib.PosixPath
4
+ - ../
5
+ - data
6
+ - SoundSpaces
7
+ - frl_apartment_4
8
+ experiment_name: frl_apartment_4_NeRAF
9
+ gradient_accumulation_steps: {}
10
+ load_checkpoint: null
11
+ load_config: null
12
+ load_dir: null
13
+ load_scheduler: true
14
+ load_step: null
15
+ log_gradients: false
16
+ logging: !!python/object:nerfstudio.configs.base_config.LoggingConfig
17
+ local_writer: !!python/object:nerfstudio.configs.base_config.LocalWriterConfig
18
+ _target: !!python/name:nerfstudio.utils.writer.LocalWriter ''
19
+ enable: true
20
+ max_log_size: 10
21
+ stats_to_track: !!python/tuple
22
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
23
+ - Train Iter (time)
24
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
25
+ - Train Rays / Sec
26
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
27
+ - Test PSNR
28
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
29
+ - Vis Rays / Sec
30
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
31
+ - Test Rays / Sec
32
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
33
+ - ETA (time)
34
+ max_buffer_size: 20
35
+ profiler: basic
36
+ relative_log_dir: !!python/object/apply:pathlib.PosixPath []
37
+ steps_per_log: 10
38
+ machine: !!python/object:nerfstudio.configs.base_config.MachineConfig
39
+ device_type: cuda
40
+ dist_url: auto
41
+ machine_rank: 0
42
+ num_devices: 1
43
+ num_machines: 1
44
+ seed: 42
45
+ max_num_iterations: 500001
46
+ method_name: NeRAF
47
+ mixed_precision: true
48
+ optimizers:
49
+ audio_fields:
50
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
51
+ _target: &id001 !!python/name:torch.optim.adam.Adam ''
52
+ eps: 1.0e-15
53
+ lr: 0.0001
54
+ max_norm: null
55
+ weight_decay: 0
56
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
57
+ _target: &id002 !!python/name:nerfstudio.engine.schedulers.ExponentialDecayScheduler ''
58
+ lr_final: 1.0e-08
59
+ lr_pre_warmup: 1.0e-08
60
+ max_steps: 1002000
61
+ ramp: cosine
62
+ warmup_steps: 2000
63
+ camera_opt:
64
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
65
+ _target: *id001
66
+ eps: 1.0e-15
67
+ lr: 0.001
68
+ max_norm: null
69
+ weight_decay: 0
70
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
71
+ _target: *id002
72
+ lr_final: 0.0001
73
+ lr_pre_warmup: 1.0e-08
74
+ max_steps: 5000
75
+ ramp: cosine
76
+ warmup_steps: 0
77
+ fields:
78
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
79
+ _target: *id001
80
+ eps: 1.0e-15
81
+ lr: 0.01
82
+ max_norm: null
83
+ weight_decay: 0
84
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
85
+ _target: *id002
86
+ lr_final: 0.0001
87
+ lr_pre_warmup: 1.0e-08
88
+ max_steps: 200000
89
+ ramp: cosine
90
+ warmup_steps: 0
91
+ proposal_networks:
92
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
93
+ _target: *id001
94
+ eps: 1.0e-15
95
+ lr: 0.01
96
+ max_norm: null
97
+ weight_decay: 0
98
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
99
+ _target: *id002
100
+ lr_final: 0.0001
101
+ lr_pre_warmup: 1.0e-08
102
+ max_steps: 200000
103
+ ramp: cosine
104
+ warmup_steps: 0
105
+ output_dir: !!python/object/apply:pathlib.PosixPath
106
+ - ../
107
+ - outputs
108
+ pipeline: !!python/object:NeRAF.NeRAF_pipeline.NeRAFPipelineConfig
109
+ _target: !!python/name:NeRAF.NeRAF_pipeline.NeRAFPipeline ''
110
+ audio_datamanager: !!python/object:NeRAF.NeRAF_datamanager.SoundSpacesDataManagerConfig
111
+ _target: !!python/name:NeRAF.NeRAF_datamanager.SoundSpacesDataManager ''
112
+ collate_fn: &id003 !!python/name:nerfstudio.data.utils.nerfstudio_collate.nerfstudio_collate ''
113
+ data: null
114
+ dataparser: !!python/object:NeRAF.NeRAF_dataparser.SoundSpacesDataParserConfig
115
+ _target: !!python/name:NeRAF.NeRAF_dataparser.SoundSpacesDataParser ''
116
+ data: !!python/object/apply:pathlib.PosixPath []
117
+ eval_num_rays_per_batch: 2048
118
+ fs: 22050
119
+ hop_len: 128
120
+ images_on_gpu: false
121
+ masks_on_gpu: false
122
+ max_len: 103
123
+ train_num_rays_per_batch: 2048
124
+ audio_model: !!python/object:NeRAF.NeRAF_model.NeRAFAudioModelConfig
125
+ N_features: 2048
126
+ N_freq_stft: 257
127
+ W_field: 512
128
+ _target: !!python/name:NeRAF.NeRAF_model.NeRAFAudioModel ''
129
+ collider_params:
130
+ far_plane: 6.0
131
+ near_plane: 2.0
132
+ criterion: SC+SLMSE
133
+ dataset: SoundSpaces
134
+ enable_collider: true
135
+ eval_num_rays_per_chunk: 4096
136
+ fs: 22050
137
+ grid_step: 0.0078125
138
+ hop_len: 128
139
+ loss_coefficients:
140
+ rgb_loss_coarse: 1.0
141
+ rgb_loss_fine: 1.0
142
+ loss_factor: 0.001
143
+ max_len: 103
144
+ prompt: null
145
+ use_grid: true
146
+ use_multiple_viewing_directions: true
147
+ win_len: 512
148
+ datamanager: !!python/object:nerfstudio.data.datamanagers.parallel_datamanager.ParallelDataManagerConfig
149
+ _target: !!python/name:nerfstudio.data.datamanagers.parallel_datamanager.ParallelDataManager ''
150
+ camera_optimizer: null
151
+ camera_res_scale_factor: 1.0
152
+ collate_fn: *id003
153
+ data: *id004
154
+ dataparser: !!python/object:nerfstudio.data.dataparsers.nerfstudio_dataparser.NerfstudioDataParserConfig
155
+ _target: !!python/name:nerfstudio.data.dataparsers.nerfstudio_dataparser.Nerfstudio ''
156
+ auto_scale_poses: true
157
+ center_method: poses
158
+ data: !!python/object/apply:pathlib.PosixPath []
159
+ depth_unit_scale_factor: 0.001
160
+ downscale_factor: null
161
+ eval_interval: 8
162
+ eval_mode: filename
163
+ load_3D_points: false
164
+ mask_color: null
165
+ orientation_method: up
166
+ scale_factor: 1.0
167
+ scene_scale: 1.0
168
+ train_split_fraction: 0.9
169
+ eval_image_indices: !!python/tuple
170
+ - 0
171
+ eval_num_images_to_sample_from: -1
172
+ eval_num_rays_per_batch: 4096
173
+ eval_num_times_to_repeat_images: -1
174
+ images_on_gpu: true
175
+ masks_on_gpu: true
176
+ max_thread_workers: null
177
+ num_processes: 1
178
+ patch_size: 1
179
+ pixel_sampler: !!python/object:nerfstudio.data.pixel_samplers.PixelSamplerConfig
180
+ _target: !!python/name:nerfstudio.data.pixel_samplers.PixelSampler ''
181
+ fisheye_crop_radius: null
182
+ ignore_mask: false
183
+ is_equirectangular: false
184
+ keep_full_image: false
185
+ max_num_iterations: 100
186
+ num_rays_per_batch: 4096
187
+ rejection_sample_mask: true
188
+ queue_size: 2
189
+ train_num_images_to_sample_from: -1
190
+ train_num_rays_per_batch: 4096
191
+ train_num_times_to_repeat_images: -1
192
+ model: !!python/object:nerfstudio.models.base_model.ModelConfig
193
+ _target: !!python/name:nerfstudio.models.base_model.Model ''
194
+ collider_params:
195
+ far_plane: 6.0
196
+ near_plane: 2.0
197
+ enable_collider: true
198
+ eval_num_rays_per_chunk: 4096
199
+ loss_coefficients:
200
+ rgb_loss_coarse: 1.0
201
+ rgb_loss_fine: 1.0
202
+ prompt: null
203
+ save_eval_audio_path: null
204
+ start_step_audio: 2000
205
+ vision_model: !!python/object:NeRAF.NeRAF_model.NeRAFVisionModelConfig
206
+ _target: !!python/name:NeRAF.NeRAF_model.NeRAFVisionModel ''
207
+ appearance_embed_dim: 32
208
+ average_init_density: 0.01
209
+ background_color: last_sample
210
+ base_res: 16
211
+ camera_optimizer: !!python/object:nerfstudio.cameras.camera_optimizers.CameraOptimizerConfig
212
+ _target: !!python/name:nerfstudio.cameras.camera_optimizers.CameraOptimizer ''
213
+ mode: SO3xR3
214
+ optimizer: null
215
+ rot_l2_penalty: 0.001
216
+ scheduler: null
217
+ trans_l2_penalty: 0.01
218
+ collider_params:
219
+ far_plane: 6.0
220
+ near_plane: 2.0
221
+ disable_scene_contraction: false
222
+ distortion_loss_mult: 0.002
223
+ enable_collider: true
224
+ eval_num_rays_per_chunk: 32768
225
+ far_plane: 1000.0
226
+ features_per_level: 2
227
+ hidden_dim: 64
228
+ hidden_dim_color: 64
229
+ hidden_dim_transient: 64
230
+ implementation: tcnn
231
+ interlevel_loss_mult: 1.0
232
+ log2_hashmap_size: 19
233
+ loss_coefficients:
234
+ rgb_loss_coarse: 1.0
235
+ rgb_loss_fine: 1.0
236
+ max_res: 2048
237
+ near_plane: 0.05
238
+ num_levels: 16
239
+ num_nerf_samples_per_ray: 48
240
+ num_proposal_iterations: 2
241
+ num_proposal_samples_per_ray: !!python/tuple
242
+ - 256
243
+ - 96
244
+ orientation_loss_mult: 0.0001
245
+ pred_normal_loss_mult: 0.001
246
+ predict_normals: false
247
+ prompt: null
248
+ proposal_initial_sampler: piecewise
249
+ proposal_net_args_list:
250
+ - hidden_dim: 16
251
+ log2_hashmap_size: 17
252
+ max_res: 128
253
+ num_levels: 5
254
+ use_linear: false
255
+ - hidden_dim: 16
256
+ log2_hashmap_size: 17
257
+ max_res: 256
258
+ num_levels: 5
259
+ use_linear: false
260
+ proposal_update_every: 5
261
+ proposal_warmup: 5000
262
+ proposal_weights_anneal_max_num_iters: 1000
263
+ proposal_weights_anneal_slope: 10.0
264
+ use_appearance_embedding: true
265
+ use_average_appearance_embedding: true
266
+ use_gradient_scaling: false
267
+ use_proposal_weight_anneal: true
268
+ use_same_proposal_network: false
269
+ use_single_jitter: true
270
+ project_name: nerfstudio-project
271
+ prompt: null
272
+ relative_model_dir: !!python/object/apply:pathlib.PosixPath
273
+ - nerfstudio_models
274
+ save_only_latest_checkpoint: false
275
+ steps_per_eval_all_images: 10000
276
+ steps_per_eval_batch: 10000
277
+ steps_per_eval_image: 10000
278
+ steps_per_save: 10000
279
+ timestamp: 2024-10-20_105001
280
+ use_grad_scaler: false
281
+ viewer: !!python/object:nerfstudio.configs.base_config.ViewerConfig
282
+ camera_frustum_scale: 0.1
283
+ default_composite_depth: true
284
+ image_format: jpeg
285
+ jpeg_quality: 75
286
+ make_share_url: false
287
+ max_num_display_images: 512
288
+ num_rays_per_chunk: 32768
289
+ quit_on_train_completion: false
290
+ relative_log_filename: viewer_log_filename.txt
291
+ websocket_host: 0.0.0.0
292
+ websocket_port: null
293
+ websocket_port_default: 7007
294
+ vis: tensorboard
SoundSpaces/frl_apartment_4_NeRAF/NeRAF/2024-10-20_105001/dataparser_transforms.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "transform": [
3
+ [
4
+ 1.0,
5
+ 0.0,
6
+ 0.0,
7
+ 2.6369545459747314
8
+ ],
9
+ [
10
+ 0.0,
11
+ 1.0,
12
+ 0.0,
13
+ -2.6249184608459473
14
+ ],
15
+ [
16
+ 0.0,
17
+ 0.0,
18
+ 1.0,
19
+ 1.451151728630066
20
+ ]
21
+ ],
22
+ "scale": 0.18359158603929643
23
+ }
SoundSpaces/frl_apartment_4_NeRAF/NeRAF/2024-10-20_105001/nerfstudio_models/step-000170000.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:040c2a17899a01ba911ee70eb37b644c43bcbec08a993376e3b5c92fee422223
3
+ size 1194988689
SoundSpaces/office_4_NeRAF/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/office_4_NeRAF/NeRAF/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/office_4_NeRAF/NeRAF/2024-10-11_101120/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/office_4_NeRAF/NeRAF/2024-10-11_101120/config.yml ADDED
@@ -0,0 +1,294 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ !!python/object:nerfstudio.engine.trainer.TrainerConfig
2
+ _target: !!python/name:nerfstudio.engine.trainer.Trainer ''
3
+ data: &id004 !!python/object/apply:pathlib.PosixPath
4
+ - ../
5
+ - data
6
+ - SoundSpaces
7
+ - office_4
8
+ experiment_name: office_4_NeRAF
9
+ gradient_accumulation_steps: {}
10
+ load_checkpoint: null
11
+ load_config: null
12
+ load_dir: null
13
+ load_scheduler: true
14
+ load_step: null
15
+ log_gradients: false
16
+ logging: !!python/object:nerfstudio.configs.base_config.LoggingConfig
17
+ local_writer: !!python/object:nerfstudio.configs.base_config.LocalWriterConfig
18
+ _target: !!python/name:nerfstudio.utils.writer.LocalWriter ''
19
+ enable: true
20
+ max_log_size: 10
21
+ stats_to_track: !!python/tuple
22
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
23
+ - Train Iter (time)
24
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
25
+ - Train Rays / Sec
26
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
27
+ - Test PSNR
28
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
29
+ - Vis Rays / Sec
30
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
31
+ - Test Rays / Sec
32
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
33
+ - ETA (time)
34
+ max_buffer_size: 20
35
+ profiler: basic
36
+ relative_log_dir: !!python/object/apply:pathlib.PosixPath []
37
+ steps_per_log: 10
38
+ machine: !!python/object:nerfstudio.configs.base_config.MachineConfig
39
+ device_type: cuda
40
+ dist_url: auto
41
+ machine_rank: 0
42
+ num_devices: 1
43
+ num_machines: 1
44
+ seed: 42
45
+ max_num_iterations: 500001
46
+ method_name: NeRAF
47
+ mixed_precision: true
48
+ optimizers:
49
+ audio_fields:
50
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
51
+ _target: &id001 !!python/name:torch.optim.adam.Adam ''
52
+ eps: 1.0e-15
53
+ lr: 0.0001
54
+ max_norm: null
55
+ weight_decay: 0
56
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
57
+ _target: &id002 !!python/name:nerfstudio.engine.schedulers.ExponentialDecayScheduler ''
58
+ lr_final: 1.0e-08
59
+ lr_pre_warmup: 1.0e-08
60
+ max_steps: 1002000
61
+ ramp: cosine
62
+ warmup_steps: 2000
63
+ camera_opt:
64
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
65
+ _target: *id001
66
+ eps: 1.0e-15
67
+ lr: 0.001
68
+ max_norm: null
69
+ weight_decay: 0
70
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
71
+ _target: *id002
72
+ lr_final: 0.0001
73
+ lr_pre_warmup: 1.0e-08
74
+ max_steps: 5000
75
+ ramp: cosine
76
+ warmup_steps: 0
77
+ fields:
78
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
79
+ _target: *id001
80
+ eps: 1.0e-15
81
+ lr: 0.01
82
+ max_norm: null
83
+ weight_decay: 0
84
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
85
+ _target: *id002
86
+ lr_final: 0.0001
87
+ lr_pre_warmup: 1.0e-08
88
+ max_steps: 200000
89
+ ramp: cosine
90
+ warmup_steps: 0
91
+ proposal_networks:
92
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
93
+ _target: *id001
94
+ eps: 1.0e-15
95
+ lr: 0.01
96
+ max_norm: null
97
+ weight_decay: 0
98
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
99
+ _target: *id002
100
+ lr_final: 0.0001
101
+ lr_pre_warmup: 1.0e-08
102
+ max_steps: 200000
103
+ ramp: cosine
104
+ warmup_steps: 0
105
+ output_dir: !!python/object/apply:pathlib.PosixPath
106
+ - ../
107
+ - outputs
108
+ pipeline: !!python/object:NeRAF.NeRAF_pipeline.NeRAFPipelineConfig
109
+ _target: !!python/name:NeRAF.NeRAF_pipeline.NeRAFPipeline ''
110
+ audio_datamanager: !!python/object:NeRAF.NeRAF_datamanager.SoundSpacesDataManagerConfig
111
+ _target: !!python/name:NeRAF.NeRAF_datamanager.SoundSpacesDataManager ''
112
+ collate_fn: &id003 !!python/name:nerfstudio.data.utils.nerfstudio_collate.nerfstudio_collate ''
113
+ data: null
114
+ dataparser: !!python/object:NeRAF.NeRAF_dataparser.SoundSpacesDataParserConfig
115
+ _target: !!python/name:NeRAF.NeRAF_dataparser.SoundSpacesDataParser ''
116
+ data: !!python/object/apply:pathlib.PosixPath []
117
+ eval_num_rays_per_batch: 2048
118
+ fs: 22050
119
+ hop_len: 128
120
+ images_on_gpu: false
121
+ masks_on_gpu: false
122
+ max_len: 78
123
+ train_num_rays_per_batch: 2048
124
+ audio_model: !!python/object:NeRAF.NeRAF_model.NeRAFAudioModelConfig
125
+ N_features: 1024
126
+ N_freq_stft: 257
127
+ W_field: 512
128
+ _target: !!python/name:NeRAF.NeRAF_model.NeRAFAudioModel ''
129
+ collider_params:
130
+ far_plane: 6.0
131
+ near_plane: 2.0
132
+ criterion: SC+SLMSE
133
+ dataset: SoundSpaces
134
+ enable_collider: true
135
+ eval_num_rays_per_chunk: 4096
136
+ fs: 22050
137
+ grid_step: 0.0078125
138
+ hop_len: 128
139
+ loss_coefficients:
140
+ rgb_loss_coarse: 1.0
141
+ rgb_loss_fine: 1.0
142
+ loss_factor: 0.001
143
+ max_len: 78
144
+ prompt: null
145
+ use_grid: true
146
+ use_multiple_viewing_directions: true
147
+ win_len: 512
148
+ datamanager: !!python/object:nerfstudio.data.datamanagers.parallel_datamanager.ParallelDataManagerConfig
149
+ _target: !!python/name:nerfstudio.data.datamanagers.parallel_datamanager.ParallelDataManager ''
150
+ camera_optimizer: null
151
+ camera_res_scale_factor: 1.0
152
+ collate_fn: *id003
153
+ data: *id004
154
+ dataparser: !!python/object:nerfstudio.data.dataparsers.nerfstudio_dataparser.NerfstudioDataParserConfig
155
+ _target: !!python/name:nerfstudio.data.dataparsers.nerfstudio_dataparser.Nerfstudio ''
156
+ auto_scale_poses: true
157
+ center_method: poses
158
+ data: !!python/object/apply:pathlib.PosixPath []
159
+ depth_unit_scale_factor: 0.001
160
+ downscale_factor: null
161
+ eval_interval: 8
162
+ eval_mode: filename
163
+ load_3D_points: false
164
+ mask_color: null
165
+ orientation_method: up
166
+ scale_factor: 1.0
167
+ scene_scale: 1.0
168
+ train_split_fraction: 0.9
169
+ eval_image_indices: !!python/tuple
170
+ - 0
171
+ eval_num_images_to_sample_from: -1
172
+ eval_num_rays_per_batch: 4096
173
+ eval_num_times_to_repeat_images: -1
174
+ images_on_gpu: true
175
+ masks_on_gpu: true
176
+ max_thread_workers: null
177
+ num_processes: 1
178
+ patch_size: 1
179
+ pixel_sampler: !!python/object:nerfstudio.data.pixel_samplers.PixelSamplerConfig
180
+ _target: !!python/name:nerfstudio.data.pixel_samplers.PixelSampler ''
181
+ fisheye_crop_radius: null
182
+ ignore_mask: false
183
+ is_equirectangular: false
184
+ keep_full_image: false
185
+ max_num_iterations: 100
186
+ num_rays_per_batch: 4096
187
+ rejection_sample_mask: true
188
+ queue_size: 2
189
+ train_num_images_to_sample_from: -1
190
+ train_num_rays_per_batch: 4096
191
+ train_num_times_to_repeat_images: -1
192
+ model: !!python/object:nerfstudio.models.base_model.ModelConfig
193
+ _target: !!python/name:nerfstudio.models.base_model.Model ''
194
+ collider_params:
195
+ far_plane: 6.0
196
+ near_plane: 2.0
197
+ enable_collider: true
198
+ eval_num_rays_per_chunk: 4096
199
+ loss_coefficients:
200
+ rgb_loss_coarse: 1.0
201
+ rgb_loss_fine: 1.0
202
+ prompt: null
203
+ save_eval_audio_path: null
204
+ start_step_audio: 2000
205
+ vision_model: !!python/object:NeRAF.NeRAF_model.NeRAFVisionModelConfig
206
+ _target: !!python/name:NeRAF.NeRAF_model.NeRAFVisionModel ''
207
+ appearance_embed_dim: 32
208
+ average_init_density: 0.01
209
+ background_color: last_sample
210
+ base_res: 16
211
+ camera_optimizer: !!python/object:nerfstudio.cameras.camera_optimizers.CameraOptimizerConfig
212
+ _target: !!python/name:nerfstudio.cameras.camera_optimizers.CameraOptimizer ''
213
+ mode: SO3xR3
214
+ optimizer: null
215
+ rot_l2_penalty: 0.001
216
+ scheduler: null
217
+ trans_l2_penalty: 0.01
218
+ collider_params:
219
+ far_plane: 6.0
220
+ near_plane: 2.0
221
+ disable_scene_contraction: false
222
+ distortion_loss_mult: 0.002
223
+ enable_collider: true
224
+ eval_num_rays_per_chunk: 32768
225
+ far_plane: 1000.0
226
+ features_per_level: 2
227
+ hidden_dim: 64
228
+ hidden_dim_color: 64
229
+ hidden_dim_transient: 64
230
+ implementation: tcnn
231
+ interlevel_loss_mult: 1.0
232
+ log2_hashmap_size: 19
233
+ loss_coefficients:
234
+ rgb_loss_coarse: 1.0
235
+ rgb_loss_fine: 1.0
236
+ max_res: 2048
237
+ near_plane: 0.05
238
+ num_levels: 16
239
+ num_nerf_samples_per_ray: 48
240
+ num_proposal_iterations: 2
241
+ num_proposal_samples_per_ray: !!python/tuple
242
+ - 256
243
+ - 96
244
+ orientation_loss_mult: 0.0001
245
+ pred_normal_loss_mult: 0.001
246
+ predict_normals: false
247
+ prompt: null
248
+ proposal_initial_sampler: piecewise
249
+ proposal_net_args_list:
250
+ - hidden_dim: 16
251
+ log2_hashmap_size: 17
252
+ max_res: 128
253
+ num_levels: 5
254
+ use_linear: false
255
+ - hidden_dim: 16
256
+ log2_hashmap_size: 17
257
+ max_res: 256
258
+ num_levels: 5
259
+ use_linear: false
260
+ proposal_update_every: 5
261
+ proposal_warmup: 5000
262
+ proposal_weights_anneal_max_num_iters: 1000
263
+ proposal_weights_anneal_slope: 10.0
264
+ use_appearance_embedding: true
265
+ use_average_appearance_embedding: true
266
+ use_gradient_scaling: false
267
+ use_proposal_weight_anneal: true
268
+ use_same_proposal_network: false
269
+ use_single_jitter: true
270
+ project_name: nerfstudio-project
271
+ prompt: null
272
+ relative_model_dir: !!python/object/apply:pathlib.PosixPath
273
+ - nerfstudio_models
274
+ save_only_latest_checkpoint: false
275
+ steps_per_eval_all_images: 10000
276
+ steps_per_eval_batch: 10000
277
+ steps_per_eval_image: 10000
278
+ steps_per_save: 10000
279
+ timestamp: 2024-10-11_101120
280
+ use_grad_scaler: false
281
+ viewer: !!python/object:nerfstudio.configs.base_config.ViewerConfig
282
+ camera_frustum_scale: 0.1
283
+ default_composite_depth: true
284
+ image_format: jpeg
285
+ jpeg_quality: 75
286
+ make_share_url: false
287
+ max_num_display_images: 512
288
+ num_rays_per_chunk: 32768
289
+ quit_on_train_completion: false
290
+ relative_log_filename: viewer_log_filename.txt
291
+ websocket_host: 0.0.0.0
292
+ websocket_port: null
293
+ websocket_port_default: 7007
294
+ vis: tensorboard
SoundSpaces/office_4_NeRAF/NeRAF/2024-10-11_101120/dataparser_transforms.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "transform": [
3
+ [
4
+ 1.0,
5
+ 0.0,
6
+ 0.0,
7
+ 2.089837074279785
8
+ ],
9
+ [
10
+ 0.0,
11
+ 1.0,
12
+ 0.0,
13
+ 1.5238884687423706
14
+ ],
15
+ [
16
+ 0.0,
17
+ 0.0,
18
+ 1.0,
19
+ 1.1040260791778564
20
+ ]
21
+ ],
22
+ "scale": 0.36437187805494425
23
+ }
SoundSpaces/office_4_NeRAF/NeRAF/2024-10-11_101120/nerfstudio_models/step-000460000.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6de3e2336f43dbee1b93ab77094e6b7b883fb229aec1738d1ed29eaed4eab82b
3
+ size 782750627
SoundSpaces/room_2_NeRAF/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/room_2_NeRAF/NeRAF/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/room_2_NeRAF/NeRAF/2024-10-14_045651/.DS_Store ADDED
Binary file (6.15 kB). View file
 
SoundSpaces/room_2_NeRAF/NeRAF/2024-10-14_045651/config.yml ADDED
@@ -0,0 +1,294 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ !!python/object:nerfstudio.engine.trainer.TrainerConfig
2
+ _target: !!python/name:nerfstudio.engine.trainer.Trainer ''
3
+ data: &id004 !!python/object/apply:pathlib.PosixPath
4
+ - ../
5
+ - data
6
+ - SoundSpaces
7
+ - room_2
8
+ experiment_name: room_2_NeRAF
9
+ gradient_accumulation_steps: {}
10
+ load_checkpoint: null
11
+ load_config: null
12
+ load_dir: null
13
+ load_scheduler: true
14
+ load_step: null
15
+ log_gradients: false
16
+ logging: !!python/object:nerfstudio.configs.base_config.LoggingConfig
17
+ local_writer: !!python/object:nerfstudio.configs.base_config.LocalWriterConfig
18
+ _target: !!python/name:nerfstudio.utils.writer.LocalWriter ''
19
+ enable: true
20
+ max_log_size: 10
21
+ stats_to_track: !!python/tuple
22
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
23
+ - Train Iter (time)
24
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
25
+ - Train Rays / Sec
26
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
27
+ - Test PSNR
28
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
29
+ - Vis Rays / Sec
30
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
31
+ - Test Rays / Sec
32
+ - !!python/object/apply:nerfstudio.utils.writer.EventName
33
+ - ETA (time)
34
+ max_buffer_size: 20
35
+ profiler: basic
36
+ relative_log_dir: !!python/object/apply:pathlib.PosixPath []
37
+ steps_per_log: 10
38
+ machine: !!python/object:nerfstudio.configs.base_config.MachineConfig
39
+ device_type: cuda
40
+ dist_url: auto
41
+ machine_rank: 0
42
+ num_devices: 1
43
+ num_machines: 1
44
+ seed: 42
45
+ max_num_iterations: 500001
46
+ method_name: NeRAF
47
+ mixed_precision: true
48
+ optimizers:
49
+ audio_fields:
50
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
51
+ _target: &id001 !!python/name:torch.optim.adam.Adam ''
52
+ eps: 1.0e-15
53
+ lr: 0.0001
54
+ max_norm: null
55
+ weight_decay: 0
56
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
57
+ _target: &id002 !!python/name:nerfstudio.engine.schedulers.ExponentialDecayScheduler ''
58
+ lr_final: 1.0e-08
59
+ lr_pre_warmup: 1.0e-08
60
+ max_steps: 1002000
61
+ ramp: cosine
62
+ warmup_steps: 2000
63
+ camera_opt:
64
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
65
+ _target: *id001
66
+ eps: 1.0e-15
67
+ lr: 0.001
68
+ max_norm: null
69
+ weight_decay: 0
70
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
71
+ _target: *id002
72
+ lr_final: 0.0001
73
+ lr_pre_warmup: 1.0e-08
74
+ max_steps: 5000
75
+ ramp: cosine
76
+ warmup_steps: 0
77
+ fields:
78
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
79
+ _target: *id001
80
+ eps: 1.0e-15
81
+ lr: 0.01
82
+ max_norm: null
83
+ weight_decay: 0
84
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
85
+ _target: *id002
86
+ lr_final: 0.0001
87
+ lr_pre_warmup: 1.0e-08
88
+ max_steps: 200000
89
+ ramp: cosine
90
+ warmup_steps: 0
91
+ proposal_networks:
92
+ optimizer: !!python/object:nerfstudio.engine.optimizers.AdamOptimizerConfig
93
+ _target: *id001
94
+ eps: 1.0e-15
95
+ lr: 0.01
96
+ max_norm: null
97
+ weight_decay: 0
98
+ scheduler: !!python/object:nerfstudio.engine.schedulers.ExponentialDecaySchedulerConfig
99
+ _target: *id002
100
+ lr_final: 0.0001
101
+ lr_pre_warmup: 1.0e-08
102
+ max_steps: 200000
103
+ ramp: cosine
104
+ warmup_steps: 0
105
+ output_dir: !!python/object/apply:pathlib.PosixPath
106
+ - ../
107
+ - outputs
108
+ pipeline: !!python/object:NeRAF.NeRAF_pipeline.NeRAFPipelineConfig
109
+ _target: !!python/name:NeRAF.NeRAF_pipeline.NeRAFPipeline ''
110
+ audio_datamanager: !!python/object:NeRAF.NeRAF_datamanager.SoundSpacesDataManagerConfig
111
+ _target: !!python/name:NeRAF.NeRAF_datamanager.SoundSpacesDataManager ''
112
+ collate_fn: &id003 !!python/name:nerfstudio.data.utils.nerfstudio_collate.nerfstudio_collate ''
113
+ data: null
114
+ dataparser: !!python/object:NeRAF.NeRAF_dataparser.SoundSpacesDataParserConfig
115
+ _target: !!python/name:NeRAF.NeRAF_dataparser.SoundSpacesDataParser ''
116
+ data: !!python/object/apply:pathlib.PosixPath []
117
+ eval_num_rays_per_batch: 2048
118
+ fs: 22050
119
+ hop_len: 128
120
+ images_on_gpu: false
121
+ masks_on_gpu: false
122
+ max_len: 84
123
+ train_num_rays_per_batch: 2048
124
+ audio_model: !!python/object:NeRAF.NeRAF_model.NeRAFAudioModelConfig
125
+ N_features: 1024
126
+ N_freq_stft: 257
127
+ W_field: 512
128
+ _target: !!python/name:NeRAF.NeRAF_model.NeRAFAudioModel ''
129
+ collider_params:
130
+ far_plane: 6.0
131
+ near_plane: 2.0
132
+ criterion: SC+SLMSE
133
+ dataset: SoundSpaces
134
+ enable_collider: true
135
+ eval_num_rays_per_chunk: 4096
136
+ fs: 22050
137
+ grid_step: 0.0078125
138
+ hop_len: 128
139
+ loss_coefficients:
140
+ rgb_loss_coarse: 1.0
141
+ rgb_loss_fine: 1.0
142
+ loss_factor: 0.001
143
+ max_len: 84
144
+ prompt: null
145
+ use_grid: true
146
+ use_multiple_viewing_directions: true
147
+ win_len: 512
148
+ datamanager: !!python/object:nerfstudio.data.datamanagers.parallel_datamanager.ParallelDataManagerConfig
149
+ _target: !!python/name:nerfstudio.data.datamanagers.parallel_datamanager.ParallelDataManager ''
150
+ camera_optimizer: null
151
+ camera_res_scale_factor: 1.0
152
+ collate_fn: *id003
153
+ data: *id004
154
+ dataparser: !!python/object:nerfstudio.data.dataparsers.nerfstudio_dataparser.NerfstudioDataParserConfig
155
+ _target: !!python/name:nerfstudio.data.dataparsers.nerfstudio_dataparser.Nerfstudio ''
156
+ auto_scale_poses: true
157
+ center_method: poses
158
+ data: !!python/object/apply:pathlib.PosixPath []
159
+ depth_unit_scale_factor: 0.001
160
+ downscale_factor: null
161
+ eval_interval: 8
162
+ eval_mode: filename
163
+ load_3D_points: false
164
+ mask_color: null
165
+ orientation_method: up
166
+ scale_factor: 1.0
167
+ scene_scale: 1.0
168
+ train_split_fraction: 0.9
169
+ eval_image_indices: !!python/tuple
170
+ - 0
171
+ eval_num_images_to_sample_from: -1
172
+ eval_num_rays_per_batch: 4096
173
+ eval_num_times_to_repeat_images: -1
174
+ images_on_gpu: true
175
+ masks_on_gpu: true
176
+ max_thread_workers: null
177
+ num_processes: 1
178
+ patch_size: 1
179
+ pixel_sampler: !!python/object:nerfstudio.data.pixel_samplers.PixelSamplerConfig
180
+ _target: !!python/name:nerfstudio.data.pixel_samplers.PixelSampler ''
181
+ fisheye_crop_radius: null
182
+ ignore_mask: false
183
+ is_equirectangular: false
184
+ keep_full_image: false
185
+ max_num_iterations: 100
186
+ num_rays_per_batch: 4096
187
+ rejection_sample_mask: true
188
+ queue_size: 2
189
+ train_num_images_to_sample_from: -1
190
+ train_num_rays_per_batch: 4096
191
+ train_num_times_to_repeat_images: -1
192
+ model: !!python/object:nerfstudio.models.base_model.ModelConfig
193
+ _target: !!python/name:nerfstudio.models.base_model.Model ''
194
+ collider_params:
195
+ far_plane: 6.0
196
+ near_plane: 2.0
197
+ enable_collider: true
198
+ eval_num_rays_per_chunk: 4096
199
+ loss_coefficients:
200
+ rgb_loss_coarse: 1.0
201
+ rgb_loss_fine: 1.0
202
+ prompt: null
203
+ save_eval_audio_path: null
204
+ start_step_audio: 2000
205
+ vision_model: !!python/object:NeRAF.NeRAF_model.NeRAFVisionModelConfig
206
+ _target: !!python/name:NeRAF.NeRAF_model.NeRAFVisionModel ''
207
+ appearance_embed_dim: 32
208
+ average_init_density: 0.01
209
+ background_color: last_sample
210
+ base_res: 16
211
+ camera_optimizer: !!python/object:nerfstudio.cameras.camera_optimizers.CameraOptimizerConfig
212
+ _target: !!python/name:nerfstudio.cameras.camera_optimizers.CameraOptimizer ''
213
+ mode: SO3xR3
214
+ optimizer: null
215
+ rot_l2_penalty: 0.001
216
+ scheduler: null
217
+ trans_l2_penalty: 0.01
218
+ collider_params:
219
+ far_plane: 6.0
220
+ near_plane: 2.0
221
+ disable_scene_contraction: false
222
+ distortion_loss_mult: 0.002
223
+ enable_collider: true
224
+ eval_num_rays_per_chunk: 32768
225
+ far_plane: 1000.0
226
+ features_per_level: 2
227
+ hidden_dim: 64
228
+ hidden_dim_color: 64
229
+ hidden_dim_transient: 64
230
+ implementation: tcnn
231
+ interlevel_loss_mult: 1.0
232
+ log2_hashmap_size: 19
233
+ loss_coefficients:
234
+ rgb_loss_coarse: 1.0
235
+ rgb_loss_fine: 1.0
236
+ max_res: 2048
237
+ near_plane: 0.05
238
+ num_levels: 16
239
+ num_nerf_samples_per_ray: 48
240
+ num_proposal_iterations: 2
241
+ num_proposal_samples_per_ray: !!python/tuple
242
+ - 256
243
+ - 96
244
+ orientation_loss_mult: 0.0001
245
+ pred_normal_loss_mult: 0.001
246
+ predict_normals: false
247
+ prompt: null
248
+ proposal_initial_sampler: piecewise
249
+ proposal_net_args_list:
250
+ - hidden_dim: 16
251
+ log2_hashmap_size: 17
252
+ max_res: 128
253
+ num_levels: 5
254
+ use_linear: false
255
+ - hidden_dim: 16
256
+ log2_hashmap_size: 17
257
+ max_res: 256
258
+ num_levels: 5
259
+ use_linear: false
260
+ proposal_update_every: 5
261
+ proposal_warmup: 5000
262
+ proposal_weights_anneal_max_num_iters: 1000
263
+ proposal_weights_anneal_slope: 10.0
264
+ use_appearance_embedding: true
265
+ use_average_appearance_embedding: true
266
+ use_gradient_scaling: false
267
+ use_proposal_weight_anneal: true
268
+ use_same_proposal_network: false
269
+ use_single_jitter: true
270
+ project_name: nerfstudio-project
271
+ prompt: null
272
+ relative_model_dir: !!python/object/apply:pathlib.PosixPath
273
+ - nerfstudio_models
274
+ save_only_latest_checkpoint: false
275
+ steps_per_eval_all_images: 10000
276
+ steps_per_eval_batch: 10000
277
+ steps_per_eval_image: 10000
278
+ steps_per_save: 10000
279
+ timestamp: 2024-10-14_045651
280
+ use_grad_scaler: false
281
+ viewer: !!python/object:nerfstudio.configs.base_config.ViewerConfig
282
+ camera_frustum_scale: 0.1
283
+ default_composite_depth: true
284
+ image_format: jpeg
285
+ jpeg_quality: 75
286
+ make_share_url: false
287
+ max_num_display_images: 512
288
+ num_rays_per_chunk: 32768
289
+ quit_on_train_completion: false
290
+ relative_log_filename: viewer_log_filename.txt
291
+ websocket_host: 0.0.0.0
292
+ websocket_port: null
293
+ websocket_port_default: 7007
294
+ vis: tensorboard
SoundSpaces/room_2_NeRAF/NeRAF/2024-10-14_045651/dataparser_transforms.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "transform": [
3
+ [
4
+ 1.0,
5
+ 0.0,
6
+ 0.0,
7
+ 2.031975269317627
8
+ ],
9
+ [
10
+ 0.0,
11
+ 1.0,
12
+ 0.0,
13
+ -0.7323977947235107
14
+ ],
15
+ [
16
+ 0.0,
17
+ 0.0,
18
+ 1.0,
19
+ 2.499042510986328
20
+ ]
21
+ ],
22
+ "scale": 0.3277654238635945
23
+ }
SoundSpaces/room_2_NeRAF/NeRAF/2024-10-14_045651/nerfstudio_models/step-000160000.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64ea2d345cf504f531885609c19644e63a7314ad7be57dd764600564c8e8d658
3
+ size 782750627