# Run-level settings for a fine-tuning job.
# NOTE(review): every line of this file is wrapped in `| ... |` and carries no
# nesting indentation, so it will not load as YAML as written. Confirm how the
# file is produced and consumed before relying on it.
# Presumably the number of data-loading workers; TODO confirm.
| data_workers: 10 |
# Run name; the same string is a directory component of the checkpoint save_dir.
| name: Walrus_ft_flowbench_FPO_NS_2D_512x128_skelenton_realglobalnorm-flowb-delta-Isotr[Space-Adapt-Space-FullA-Axial]-AdamW-0.0001 |
| finetune: true |
| automatic_setup: true |
# Trainer section. `_target_` names the class to build (Hydra-style
# instantiation; hydra.utils.get_class is referenced below).
| trainer: |
| _target_: walrus.trainer.Trainer |
| max_epoch: 50 |
# Presumably measured in epochs; TODO confirm against the Trainer.
| val_frequency: 5 |
| rollout_val_frequency: 5 |
| short_validation_length: 20 |
| max_rollout_steps: 200 |
| num_time_intervals: 5 |
| enable_amp: false |
# Loss: MAE metric taken from the_well.benchmark.metrics.
| loss_fn: |
| _target_: the_well.benchmark.metrics.MAE |
# Formatter is resolved to a class through hydra.utils.get_class using `path`.
| formatter: |
| _target_: hydra.utils.get_class |
| path: walrus.data.well_to_multi_transformer.ChannelsFirstWithTimeFormatter |
# Normalization strategy, marked `_partial_: true`.
| revin: |
| _target_: walrus.trainer.normalization_strat.GlobalRevNormalization |
| _partial_: true |
# NOTE(review): indentation is lost; the keys from here to
# skip_spectral_metrics are assumed to belong to `trainer`, not `revin`.
# Confirm against the original config.
| prediction_type: delta |
| grad_acc_steps: 1 |
| image_validation: true |
| video_validation: true |
| gradient_log_level: 0 |
| clip_gradient: 10 |
| log_interval: 200 |
| loss_multiplier: 100.0 |
# false here; presumably the scheduler then steps per epoch. TODO confirm.
| lr_scheduler_per_step: false |
| skip_spectral_metrics: true |
# Optimizer section: torch.optim.AdamW.
| optimizer: |
| _target_: torch.optim.AdamW |
# Matches the "AdamW-0.0001" suffix of the run name.
| lr: 0.0001 |
| weight_decay: 0.0001 |
# NOTE(review): eps looks unusually small; confirm it is intentional.
| eps: 1.0e-10 |
# Learning-rate scheduler section. The schedule shape is defined by the
# target class, which is not visible in this file.
| lr_scheduler: |
| _target_: walrus.optim.schedulers.InverseSqrtLinearWarmupSqrtCooldown |
# Warmup and cooldown lengths are expressed in epochs (per the key names);
# the trainer section sets max_epoch: 50.
| warmup_epochs: 10 |
| cooldown_epochs: 10 |
# Presumably multipliers applied to the optimizer lr; TODO confirm.
| warmup_lr_factor: 0.1 |
| cooldown_lr_factor: 0.001 |
# Model section; the encoder sub-section comes first.
# NOTE(review): indentation is lost. All keys down to the next `decoder:` line
# are assumed to belong to `encoder`; confirm against the original config.
| model: |
| encoder: |
| _partial_: true |
| _target_: walrus.models.encoders.vstride_encoder.SpaceBagAdaptiveDVstrideEncoder |
| learned_pad: true |
# Nested lists: each `- - a` followed by `- b` reads as one inner pair [a, b].
# 1d holds one pair, 2d two pairs, 3d three pairs.
| base_kernel_size1d: |
| - - 4 |
| - 4 |
| base_kernel_size2d: |
| - - 8 |
| - 4 |
| - - 8 |
| - 4 |
| base_kernel_size3d: |
| - - 8 |
| - 4 |
| - - 8 |
| - 4 |
| - - 8 |
| - 4 |
| groups: 12 |
# Four pairs: [2, 2], [4, 2], [4, 4], [8, 4].
| kernel_scales_seq: |
| - - 2 |
| - 2 |
| - - 4 |
| - 2 |
| - - 4 |
| - 4 |
| - - 8 |
| - 4 |
| variable_downsample: true |
| variable_deterministic_ds: true |
# Activation given as a partial of torch.nn.SiLU.
| activation: |
| _partial_: true |
| _target_: torch.nn.SiLU |
# Decoder sub-section of the model. Its base kernel sizes and `groups` match
# the encoder values; it has no kernel_scales_seq or variable_* keys.
# NOTE(review): indentation is lost. All keys down to `processor:` are assumed
# to belong to `decoder`; confirm.
| decoder: |
| _partial_: true |
| _target_: walrus.models.decoders.vstride_decoder.AdaptiveDVstrideDecoder |
| learned_pad: true |
# Nested lists: each `- - a` followed by `- b` reads as one inner pair [a, b].
| base_kernel_size1d: |
| - - 4 |
| - 4 |
| base_kernel_size2d: |
| - - 8 |
| - 4 |
| - - 8 |
| - 4 |
| base_kernel_size3d: |
| - - 8 |
| - 4 |
| - - 8 |
| - 4 |
| - - 8 |
| - 4 |
| groups: 12 |
# Activation given as a partial of torch.nn.SiLU.
| activation: |
| _partial_: true |
| _target_: torch.nn.SiLU |
# Processor sub-section: a SpaceTimeSplitBlock partial composed of separate
# space, time and channel mixing components.
| processor: |
# Spatial mixing: FullAttention with 16 heads; mlp_dim is left null.
| space_mixing: |
| _partial_: true |
| _target_: walrus.models.spatial_blocks.full_attention.FullAttention |
| num_heads: 16 |
| mlp_dim: null |
# Temporal mixing: AxialTimeAttention with 16 heads and bias_type "rel".
| time_mixing: |
| _partial_: true |
| _target_: walrus.models.temporal_blocks.axial_time_attention.AxialTimeAttention |
| num_heads: 16 |
| bias_type: rel |
# Channel mixing is torch.nn.Identity.
| channel_mixing: |
| _partial_: true |
| _target_: torch.nn.Identity |
# These two keys describe the processor block itself.
| _partial_: true |
| _target_: walrus.models.spatiotemporal_blocks.space_time_split.SpaceTimeSplitBlock |
# NOTE(review): indentation is lost; norm_layer could sit under `processor`
# or directly under `model`. Confirm against the original config.
| norm_layer: |
| _partial_: true |
| _target_: walrus.models.shared_utils.normalization.RMSGroupNorm |
# Model-level target and hyperparameters (presumably direct children of
# `model`; indentation is lost, confirm).
| _target_: walrus.models.IsotropicModel |
| hidden_dim: 1408 |
| projection_dim: 48 |
| intermediate_dim: 352 |
| processor_blocks: 40 |
| drop_path: 0.0 |
| groups: 16 |
| max_d: 3 |
| static_axes: true |
| weight_tied_axes: false |
| causal_in_time: true |
# List value: [2, 3].
| include_d: |
| - 2 |
| - 3 |
# NOTE(review): the zero values below presumably mean "disabled"; TODO confirm
# against the model implementation.
| override_dimensionality: 0 |
| jitter_patches: true |
| gradient_checkpointing_freq: 0 |
| use_periodic_fixed_jitter: true |
| input_field_drop: 0 |
# Data section. field_index_map_override maps field names to integer indices;
# the 67 entries below use each index from 0 to 66 exactly once, in order.
| data: |
| field_index_map_override: |
| closed_boundary: 0 |
| open_boundary: 1 |
| bias_correction: 2 |
| pressure: 3 |
| velocity_x: 4 |
| velocity_y: 5 |
| velocity_z: 6 |
| zeros_like_density: 7 |
| speed_of_sound: 8 |
| concentration: 9 |
| D_xx: 10 |
| D_xy: 11 |
| D_xz: 12 |
| D_yx: 13 |
| D_yy: 14 |
| D_yz: 15 |
| D_zx: 16 |
| D_zy: 17 |
| D_zz: 18 |
| E_xx: 19 |
| E_xy: 20 |
| E_xz: 21 |
| E_yx: 22 |
| E_yy: 23 |
| E_yz: 24 |
| E_zx: 25 |
| E_zy: 26 |
| E_zz: 27 |
| density: 28 |
| energy: 29 |
| velocity_r: 30 |
| velocity_theta: 31 |
| velocity_phi: 32 |
| momentum_x: 33 |
| momentum_y: 34 |
| momentum_z: 35 |
| pressure_re: 36 |
| pressure_im: 37 |
| mask: 38 |
| magnetic_field_x: 39 |
| magnetic_field_y: 40 |
| magnetic_field_z: 41 |
| A: 42 |
| B: 43 |
| height: 44 |
| internal_energy: 45 |
| temperature: 46 |
| electron_fraction: 47 |
| entropy: 48 |
| magnetic_field_log_r: 49 |
| magnetic_field_theta: 50 |
| magnetic_field_phi: 51 |
| velocity_log_r: 52 |
| buoyancy: 53 |
| tracer: 54 |
| log10_density: 55 |
| log10_temperature: 56 |
# NOTE(review): lowercase `c_zz` is a distinct key from `C_zz` (index 66)
# because YAML keys are case-sensitive. Confirm the lowercase name is intended.
| c_zz: 57 |
| C_xx: 58 |
| C_xy: 59 |
| C_xz: 60 |
| C_yx: 61 |
| C_yy: 62 |
| C_yz: 63 |
| C_zx: 64 |
| C_zy: 65 |
| C_zz: 66 |
# Dataset locations and data-module parameters.
# NOTE(review): indentation is lost, so the parent of well_dataset_info and of
# normalization_path cannot be determined from this file. Confirm against the
# original config.
| well_base_path: /mnt/gpuxl/polymathic/the_well/datasets/ |
# NOTE(review): "skelenton" looks like a misspelling of "skeleton", but the
# same spelling is used in the run name, the dataset key and the dataset path
# below. Do not rename it in isolation.
| wandb_data_name: flowbench_FPO_NS_2D_512x128_skelenton |
# Data module: walrus.data.MixedWellDataModule.
| module_parameters: |
| _target_: walrus.data.MixedWellDataModule |
| batch_size: 1 |
| n_steps_input: 6 |
| n_steps_output: 1 |
# min and max are both 1, i.e. a single fixed stride value.
| min_dt_stride: 1 |
| max_dt_stride: 1 |
| max_samples: 2000 |
# Per-dataset settings; a single dataset entry is listed.
| well_dataset_info: |
| flowbench_FPO_NS_2D_512x128_skelenton: |
# Both filter lists are explicitly empty.
| include_filters: [] |
| exclude_filters: [] |
| path: /mnt/home/polymathic/ceph/WellFormattedExternalData/flowbench/flowbench_FPO_NS_2D_512x128_skelenton/ |
# Relative file name; the directory it resolves against is not visible here.
| normalization_path: logged_stats.yaml |
# Resume / override controls (presumably top-level keys; indentation is lost).
| auto_resume: true |
# Empty strings; presumably "no override". TODO confirm how '' is treated.
| folder_override: '' |
| checkpoint_override: '' |
| config_override: /mnt/home/polymathic/ceph/walrus_logging/platinum_checkpoints/extended_config.yaml |
| validation_mode: false |
# NOTE(review): `model` is listed as frozen while `finetune` is true elsewhere
# in this file. Confirm this combination is intended.
| frozen_components: |
| - model |
# Distributed-training settings: distribution_type is "fsdp"; local_size is
# left null.
| distribution: |
| distribution_type: fsdp |
| local_size: null |
# Logging settings: wandb is enabled and the project name is given below.
| logger: |
| wandb: true |
| wandb_project_name: walrus_Finetuning_Runs |
# Checkpointing section: walrus.trainer.checkpoints.CheckPointer.
| checkpoint: |
| _target_: walrus.trainer.checkpoints.CheckPointer |
# save_dir embeds the run name followed by finetune/0/checkpoints.
| save_dir: /mnt/home/polymathic/ceph/walrus_logging/runs/Walrus_ft_flowbench_FPO_NS_2D_512x128_skelenton_realglobalnorm-flowb-delta-Isotr[Space-Adapt-Space-FullA-Axial]-AdamW-0.0001/finetune/0/checkpoints |
| load_checkpoint_path: null |
# Points at a walrus.pt file under platinum_checkpoints/final_base_model;
# presumably the pretrained weights to start from. TODO confirm.
| coalesced_checkpoint_path: /mnt/home/polymathic/ceph/walrus_logging/platinum_checkpoints/final_base_model/walrus.pt |
| save_best: true |
# Presumably measured in epochs; TODO confirm.
| checkpoint_frequency: 20 |
# Fine-tuning modifications: two RoPE-related flags and an ape_shape list.
| finetuning_mods: |
| learnable_rope: true |
| rope_per_axis: true |
# List value: [33, 33, 1].
| ape_shape: |
| - 33 |
| - 33 |
| - 1 |
# NOTE(review): indentation is lost; experiment_dir is presumably a top-level
# key rather than part of finetuning_mods. Confirm. The checkpoint save_dir in
# this file starts with this same path.
| experiment_dir: /mnt/home/polymathic/ceph/walrus_logging/runs |
|
|