Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/meta_000200.json +151 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/meta_000400.json +151 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/meta_000600.json +151 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/meta_000800.json +151 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/meta_001000.json +151 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/model_000200.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/model_000400.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/model_000600.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/model_000800.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/model_001000.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000200_rank0.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000200_rank1.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000200_rank2.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000200_rank3.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000200_rank4.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000200_rank5.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000200_rank6.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000200_rank7.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000400_rank0.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000400_rank1.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000400_rank2.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000400_rank3.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000400_rank4.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000400_rank5.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000400_rank6.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000400_rank7.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000600_rank0.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000600_rank1.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000600_rank2.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000600_rank3.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000600_rank4.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000600_rank5.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000600_rank6.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000600_rank7.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000800_rank0.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000800_rank1.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000800_rank2.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000800_rank3.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000800_rank4.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000800_rank5.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000800_rank6.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000800_rank7.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_001000_rank0.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_001000_rank1.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_001000_rank2.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_001000_rank3.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_001000_rank4.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_001000_rank5.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_001000_rank6.pt +3 -0
- fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_001000_rank7.pt +3 -0
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/meta_000200.json
ADDED
|
@@ -0,0 +1,151 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"step": 200,
|
| 3 |
+
"model_type": "fm_vit",
|
| 4 |
+
"model_config": {
|
| 5 |
+
"embed_dim": 768,
|
| 6 |
+
"depth": 12,
|
| 7 |
+
"num_heads": 12,
|
| 8 |
+
"mlp_ratio": 4.0,
|
| 9 |
+
"dropout": 0.0,
|
| 10 |
+
"attn_dropout": 0.0,
|
| 11 |
+
"patch_size": 16,
|
| 12 |
+
"modalities": [
|
| 13 |
+
"sentinel2_l2a",
|
| 14 |
+
"sentinel1",
|
| 15 |
+
"landsat"
|
| 16 |
+
],
|
| 17 |
+
"modality_channels": {
|
| 18 |
+
"sentinel2_l2a": 12,
|
| 19 |
+
"sentinel1": 2,
|
| 20 |
+
"landsat": 11
|
| 21 |
+
}
|
| 22 |
+
},
|
| 23 |
+
"user_config": {
|
| 24 |
+
"h5_dir": "/workspace/olmoearth/h5_shards",
|
| 25 |
+
"s2_key": "sentinel2_l2a",
|
| 26 |
+
"s1_key": "sentinel1",
|
| 27 |
+
"landsat_key": "landsat",
|
| 28 |
+
"num_timesteps": 12,
|
| 29 |
+
"timestep_strategy": "uniform",
|
| 30 |
+
"patch_size": 16,
|
| 31 |
+
"mask_ratio": 0.75,
|
| 32 |
+
"s2_value_scale": 0.0001,
|
| 33 |
+
"s1_value_scale": 1.0,
|
| 34 |
+
"landsat_value_scale": 0.0001,
|
| 35 |
+
"norm": "computed",
|
| 36 |
+
"norm_stats_file": "",
|
| 37 |
+
"norm_std_multiplier": 2.0,
|
| 38 |
+
"num_workers": 32,
|
| 39 |
+
"prefetch": 64,
|
| 40 |
+
"shuffle_buffer": 2000,
|
| 41 |
+
"depth": 12,
|
| 42 |
+
"embed_dim": 768,
|
| 43 |
+
"num_heads": 12,
|
| 44 |
+
"mlp_ratio": 4.0,
|
| 45 |
+
"dropout": 0.0,
|
| 46 |
+
"attn_dropout": 0.0,
|
| 47 |
+
"contrastive_weight": 0.1,
|
| 48 |
+
"contrastive_temp": 0.1,
|
| 49 |
+
"contrastive_proj_dim": 256,
|
| 50 |
+
"contrastive_lr": 0.001,
|
| 51 |
+
"contrastive_queue_size": 4096,
|
| 52 |
+
"contrastive_pooling": "mean_unmasked",
|
| 53 |
+
"spatial_aug": "flip_rotate",
|
| 54 |
+
"drop_s1_p": 0.3,
|
| 55 |
+
"drop_landsat_p": 0.3,
|
| 56 |
+
"distill_weight": 1.0,
|
| 57 |
+
"distill_every": 1,
|
| 58 |
+
"distill_teacher_patch_size": 4,
|
| 59 |
+
"distill_teacher_expected_hw": 64,
|
| 60 |
+
"distill_teacher_timesteps": 1,
|
| 61 |
+
"distill_olmoearth_src_dir": "/workspace/Spatial/olmoearth_pretrain",
|
| 62 |
+
"distill_olmoearth_config": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/config.json",
|
| 63 |
+
"distill_olmoearth_weights": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/weights.pth",
|
| 64 |
+
"run": "dummy",
|
| 65 |
+
"device_type": "",
|
| 66 |
+
"num_iterations": 2000,
|
| 67 |
+
"device_batch_size": 2,
|
| 68 |
+
"grad_accum_steps": 8,
|
| 69 |
+
"lr": 0.0001,
|
| 70 |
+
"weight_decay": 0.05,
|
| 71 |
+
"adam_beta1": 0.9,
|
| 72 |
+
"adam_beta2": 0.95,
|
| 73 |
+
"warmup_ratio": 0.01,
|
| 74 |
+
"warmdown_ratio": 0.4,
|
| 75 |
+
"final_lr_frac": 0.0,
|
| 76 |
+
"grad_clip": 1.0,
|
| 77 |
+
"resume_from_step": -1,
|
| 78 |
+
"init_from_model_tag": "fmvit_d12_e768_ps16_normcomputed_contrast",
|
| 79 |
+
"init_from_step": 2600,
|
| 80 |
+
"init_from_model_path": "",
|
| 81 |
+
"init_nonstrict": false,
|
| 82 |
+
"freeze_blocks": false,
|
| 83 |
+
"freeze_final_norm": false,
|
| 84 |
+
"freeze_recon_head": false,
|
| 85 |
+
"eval_every": 200,
|
| 86 |
+
"eval_steps": 25,
|
| 87 |
+
"save_every": 200,
|
| 88 |
+
"model_tag": "fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600"
|
| 89 |
+
},
|
| 90 |
+
"dataset_meta": {
|
| 91 |
+
"h5_dir": "/workspace/olmoearth/h5_shards",
|
| 92 |
+
"s2_key": "sentinel2_l2a",
|
| 93 |
+
"s1_key": "sentinel1",
|
| 94 |
+
"landsat_key": "landsat",
|
| 95 |
+
"num_timesteps": 12,
|
| 96 |
+
"timestep_strategy": "uniform",
|
| 97 |
+
"patch_size": 16,
|
| 98 |
+
"grid_size": 8,
|
| 99 |
+
"mask_ratio": 0.75,
|
| 100 |
+
"value_scales": {
|
| 101 |
+
"sentinel2_l2a": 0.0001,
|
| 102 |
+
"sentinel1": 1.0,
|
| 103 |
+
"landsat": 0.0001
|
| 104 |
+
},
|
| 105 |
+
"norm": {
|
| 106 |
+
"strategy": "computed",
|
| 107 |
+
"stats_file": "/workspace/Spatial/olmoearth_pretrain/olmoearth_pretrain/data/norm_configs/computed.json",
|
| 108 |
+
"std_multiplier": 2.0
|
| 109 |
+
},
|
| 110 |
+
"modalities": [
|
| 111 |
+
"sentinel2_l2a",
|
| 112 |
+
"sentinel1",
|
| 113 |
+
"landsat"
|
| 114 |
+
],
|
| 115 |
+
"modality_channels": {
|
| 116 |
+
"sentinel2_l2a": 12,
|
| 117 |
+
"sentinel1": 2,
|
| 118 |
+
"landsat": 11
|
| 119 |
+
},
|
| 120 |
+
"contrastive": {
|
| 121 |
+
"weight": 0.1,
|
| 122 |
+
"temp": 0.1,
|
| 123 |
+
"proj_dim": 256,
|
| 124 |
+
"queue_size": 4096,
|
| 125 |
+
"pooling": "mean_unmasked",
|
| 126 |
+
"spatial_aug": "flip_rotate",
|
| 127 |
+
"drop_s1_p": 0.3,
|
| 128 |
+
"drop_landsat_p": 0.3
|
| 129 |
+
},
|
| 130 |
+
"distill": {
|
| 131 |
+
"weight": 1.0,
|
| 132 |
+
"every": 1,
|
| 133 |
+
"teacher_patch_size": 4,
|
| 134 |
+
"teacher_expected_hw": 64,
|
| 135 |
+
"teacher_timesteps": 1,
|
| 136 |
+
"olmoearth_config": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/config.json",
|
| 137 |
+
"olmoearth_weights": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/weights.pth"
|
| 138 |
+
}
|
| 139 |
+
},
|
| 140 |
+
"grad_accum_steps": 8,
|
| 141 |
+
"dataloader_state_dict": {
|
| 142 |
+
"epoch": 1,
|
| 143 |
+
"seen_in_epoch": 3559,
|
| 144 |
+
"rank": 0
|
| 145 |
+
},
|
| 146 |
+
"loop_state": {
|
| 147 |
+
"min_val_loss": 0.004307515919208527,
|
| 148 |
+
"smooth_train_loss": 0.5816326680596287,
|
| 149 |
+
"total_training_time": 1061.5331101417542
|
| 150 |
+
}
|
| 151 |
+
}
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/meta_000400.json
ADDED
|
@@ -0,0 +1,151 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"step": 400,
|
| 3 |
+
"model_type": "fm_vit",
|
| 4 |
+
"model_config": {
|
| 5 |
+
"embed_dim": 768,
|
| 6 |
+
"depth": 12,
|
| 7 |
+
"num_heads": 12,
|
| 8 |
+
"mlp_ratio": 4.0,
|
| 9 |
+
"dropout": 0.0,
|
| 10 |
+
"attn_dropout": 0.0,
|
| 11 |
+
"patch_size": 16,
|
| 12 |
+
"modalities": [
|
| 13 |
+
"sentinel2_l2a",
|
| 14 |
+
"sentinel1",
|
| 15 |
+
"landsat"
|
| 16 |
+
],
|
| 17 |
+
"modality_channels": {
|
| 18 |
+
"sentinel2_l2a": 12,
|
| 19 |
+
"sentinel1": 2,
|
| 20 |
+
"landsat": 11
|
| 21 |
+
}
|
| 22 |
+
},
|
| 23 |
+
"user_config": {
|
| 24 |
+
"h5_dir": "/workspace/olmoearth/h5_shards",
|
| 25 |
+
"s2_key": "sentinel2_l2a",
|
| 26 |
+
"s1_key": "sentinel1",
|
| 27 |
+
"landsat_key": "landsat",
|
| 28 |
+
"num_timesteps": 12,
|
| 29 |
+
"timestep_strategy": "uniform",
|
| 30 |
+
"patch_size": 16,
|
| 31 |
+
"mask_ratio": 0.75,
|
| 32 |
+
"s2_value_scale": 0.0001,
|
| 33 |
+
"s1_value_scale": 1.0,
|
| 34 |
+
"landsat_value_scale": 0.0001,
|
| 35 |
+
"norm": "computed",
|
| 36 |
+
"norm_stats_file": "",
|
| 37 |
+
"norm_std_multiplier": 2.0,
|
| 38 |
+
"num_workers": 32,
|
| 39 |
+
"prefetch": 64,
|
| 40 |
+
"shuffle_buffer": 2000,
|
| 41 |
+
"depth": 12,
|
| 42 |
+
"embed_dim": 768,
|
| 43 |
+
"num_heads": 12,
|
| 44 |
+
"mlp_ratio": 4.0,
|
| 45 |
+
"dropout": 0.0,
|
| 46 |
+
"attn_dropout": 0.0,
|
| 47 |
+
"contrastive_weight": 0.1,
|
| 48 |
+
"contrastive_temp": 0.1,
|
| 49 |
+
"contrastive_proj_dim": 256,
|
| 50 |
+
"contrastive_lr": 0.001,
|
| 51 |
+
"contrastive_queue_size": 4096,
|
| 52 |
+
"contrastive_pooling": "mean_unmasked",
|
| 53 |
+
"spatial_aug": "flip_rotate",
|
| 54 |
+
"drop_s1_p": 0.3,
|
| 55 |
+
"drop_landsat_p": 0.3,
|
| 56 |
+
"distill_weight": 1.0,
|
| 57 |
+
"distill_every": 1,
|
| 58 |
+
"distill_teacher_patch_size": 4,
|
| 59 |
+
"distill_teacher_expected_hw": 64,
|
| 60 |
+
"distill_teacher_timesteps": 1,
|
| 61 |
+
"distill_olmoearth_src_dir": "/workspace/Spatial/olmoearth_pretrain",
|
| 62 |
+
"distill_olmoearth_config": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/config.json",
|
| 63 |
+
"distill_olmoearth_weights": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/weights.pth",
|
| 64 |
+
"run": "dummy",
|
| 65 |
+
"device_type": "",
|
| 66 |
+
"num_iterations": 2000,
|
| 67 |
+
"device_batch_size": 2,
|
| 68 |
+
"grad_accum_steps": 8,
|
| 69 |
+
"lr": 0.0001,
|
| 70 |
+
"weight_decay": 0.05,
|
| 71 |
+
"adam_beta1": 0.9,
|
| 72 |
+
"adam_beta2": 0.95,
|
| 73 |
+
"warmup_ratio": 0.01,
|
| 74 |
+
"warmdown_ratio": 0.4,
|
| 75 |
+
"final_lr_frac": 0.0,
|
| 76 |
+
"grad_clip": 1.0,
|
| 77 |
+
"resume_from_step": 200,
|
| 78 |
+
"init_from_model_tag": "",
|
| 79 |
+
"init_from_step": -1,
|
| 80 |
+
"init_from_model_path": "",
|
| 81 |
+
"init_nonstrict": false,
|
| 82 |
+
"freeze_blocks": false,
|
| 83 |
+
"freeze_final_norm": false,
|
| 84 |
+
"freeze_recon_head": false,
|
| 85 |
+
"eval_every": 200,
|
| 86 |
+
"eval_steps": 25,
|
| 87 |
+
"save_every": 200,
|
| 88 |
+
"model_tag": "fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600"
|
| 89 |
+
},
|
| 90 |
+
"dataset_meta": {
|
| 91 |
+
"h5_dir": "/workspace/olmoearth/h5_shards",
|
| 92 |
+
"s2_key": "sentinel2_l2a",
|
| 93 |
+
"s1_key": "sentinel1",
|
| 94 |
+
"landsat_key": "landsat",
|
| 95 |
+
"num_timesteps": 12,
|
| 96 |
+
"timestep_strategy": "uniform",
|
| 97 |
+
"patch_size": 16,
|
| 98 |
+
"grid_size": 8,
|
| 99 |
+
"mask_ratio": 0.75,
|
| 100 |
+
"value_scales": {
|
| 101 |
+
"sentinel2_l2a": 0.0001,
|
| 102 |
+
"sentinel1": 1.0,
|
| 103 |
+
"landsat": 0.0001
|
| 104 |
+
},
|
| 105 |
+
"norm": {
|
| 106 |
+
"strategy": "computed",
|
| 107 |
+
"stats_file": "/workspace/Spatial/olmoearth_pretrain/olmoearth_pretrain/data/norm_configs/computed.json",
|
| 108 |
+
"std_multiplier": 2.0
|
| 109 |
+
},
|
| 110 |
+
"modalities": [
|
| 111 |
+
"sentinel2_l2a",
|
| 112 |
+
"sentinel1",
|
| 113 |
+
"landsat"
|
| 114 |
+
],
|
| 115 |
+
"modality_channels": {
|
| 116 |
+
"sentinel2_l2a": 12,
|
| 117 |
+
"sentinel1": 2,
|
| 118 |
+
"landsat": 11
|
| 119 |
+
},
|
| 120 |
+
"contrastive": {
|
| 121 |
+
"weight": 0.1,
|
| 122 |
+
"temp": 0.1,
|
| 123 |
+
"proj_dim": 256,
|
| 124 |
+
"queue_size": 4096,
|
| 125 |
+
"pooling": "mean_unmasked",
|
| 126 |
+
"spatial_aug": "flip_rotate",
|
| 127 |
+
"drop_s1_p": 0.3,
|
| 128 |
+
"drop_landsat_p": 0.3
|
| 129 |
+
},
|
| 130 |
+
"distill": {
|
| 131 |
+
"weight": 1.0,
|
| 132 |
+
"every": 1,
|
| 133 |
+
"teacher_patch_size": 4,
|
| 134 |
+
"teacher_expected_hw": 64,
|
| 135 |
+
"teacher_timesteps": 1,
|
| 136 |
+
"olmoearth_config": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/config.json",
|
| 137 |
+
"olmoearth_weights": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/weights.pth"
|
| 138 |
+
}
|
| 139 |
+
},
|
| 140 |
+
"grad_accum_steps": 8,
|
| 141 |
+
"dataloader_state_dict": {
|
| 142 |
+
"epoch": 1,
|
| 143 |
+
"seen_in_epoch": 7096,
|
| 144 |
+
"rank": 0
|
| 145 |
+
},
|
| 146 |
+
"loop_state": {
|
| 147 |
+
"min_val_loss": 0.004169567953795195,
|
| 148 |
+
"smooth_train_loss": 0.5826649194448699,
|
| 149 |
+
"total_training_time": 1072.7411074638367
|
| 150 |
+
}
|
| 151 |
+
}
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/meta_000600.json
ADDED
|
@@ -0,0 +1,151 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"step": 600,
|
| 3 |
+
"model_type": "fm_vit",
|
| 4 |
+
"model_config": {
|
| 5 |
+
"embed_dim": 768,
|
| 6 |
+
"depth": 12,
|
| 7 |
+
"num_heads": 12,
|
| 8 |
+
"mlp_ratio": 4.0,
|
| 9 |
+
"dropout": 0.0,
|
| 10 |
+
"attn_dropout": 0.0,
|
| 11 |
+
"patch_size": 16,
|
| 12 |
+
"modalities": [
|
| 13 |
+
"sentinel2_l2a",
|
| 14 |
+
"sentinel1",
|
| 15 |
+
"landsat"
|
| 16 |
+
],
|
| 17 |
+
"modality_channels": {
|
| 18 |
+
"sentinel2_l2a": 12,
|
| 19 |
+
"sentinel1": 2,
|
| 20 |
+
"landsat": 11
|
| 21 |
+
}
|
| 22 |
+
},
|
| 23 |
+
"user_config": {
|
| 24 |
+
"h5_dir": "/workspace/olmoearth/h5_shards",
|
| 25 |
+
"s2_key": "sentinel2_l2a",
|
| 26 |
+
"s1_key": "sentinel1",
|
| 27 |
+
"landsat_key": "landsat",
|
| 28 |
+
"num_timesteps": 12,
|
| 29 |
+
"timestep_strategy": "uniform",
|
| 30 |
+
"patch_size": 16,
|
| 31 |
+
"mask_ratio": 0.75,
|
| 32 |
+
"s2_value_scale": 0.0001,
|
| 33 |
+
"s1_value_scale": 1.0,
|
| 34 |
+
"landsat_value_scale": 0.0001,
|
| 35 |
+
"norm": "computed",
|
| 36 |
+
"norm_stats_file": "",
|
| 37 |
+
"norm_std_multiplier": 2.0,
|
| 38 |
+
"num_workers": 32,
|
| 39 |
+
"prefetch": 64,
|
| 40 |
+
"shuffle_buffer": 2000,
|
| 41 |
+
"depth": 12,
|
| 42 |
+
"embed_dim": 768,
|
| 43 |
+
"num_heads": 12,
|
| 44 |
+
"mlp_ratio": 4.0,
|
| 45 |
+
"dropout": 0.0,
|
| 46 |
+
"attn_dropout": 0.0,
|
| 47 |
+
"contrastive_weight": 0.1,
|
| 48 |
+
"contrastive_temp": 0.1,
|
| 49 |
+
"contrastive_proj_dim": 256,
|
| 50 |
+
"contrastive_lr": 0.001,
|
| 51 |
+
"contrastive_queue_size": 4096,
|
| 52 |
+
"contrastive_pooling": "mean_unmasked",
|
| 53 |
+
"spatial_aug": "flip_rotate",
|
| 54 |
+
"drop_s1_p": 0.3,
|
| 55 |
+
"drop_landsat_p": 0.3,
|
| 56 |
+
"distill_weight": 1.0,
|
| 57 |
+
"distill_every": 1,
|
| 58 |
+
"distill_teacher_patch_size": 4,
|
| 59 |
+
"distill_teacher_expected_hw": 64,
|
| 60 |
+
"distill_teacher_timesteps": 1,
|
| 61 |
+
"distill_olmoearth_src_dir": "/workspace/Spatial/olmoearth_pretrain",
|
| 62 |
+
"distill_olmoearth_config": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/config.json",
|
| 63 |
+
"distill_olmoearth_weights": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/weights.pth",
|
| 64 |
+
"run": "dummy",
|
| 65 |
+
"device_type": "",
|
| 66 |
+
"num_iterations": 2000,
|
| 67 |
+
"device_batch_size": 2,
|
| 68 |
+
"grad_accum_steps": 8,
|
| 69 |
+
"lr": 0.0001,
|
| 70 |
+
"weight_decay": 0.05,
|
| 71 |
+
"adam_beta1": 0.9,
|
| 72 |
+
"adam_beta2": 0.95,
|
| 73 |
+
"warmup_ratio": 0.01,
|
| 74 |
+
"warmdown_ratio": 0.4,
|
| 75 |
+
"final_lr_frac": 0.0,
|
| 76 |
+
"grad_clip": 1.0,
|
| 77 |
+
"resume_from_step": 200,
|
| 78 |
+
"init_from_model_tag": "",
|
| 79 |
+
"init_from_step": -1,
|
| 80 |
+
"init_from_model_path": "",
|
| 81 |
+
"init_nonstrict": false,
|
| 82 |
+
"freeze_blocks": false,
|
| 83 |
+
"freeze_final_norm": false,
|
| 84 |
+
"freeze_recon_head": false,
|
| 85 |
+
"eval_every": 200,
|
| 86 |
+
"eval_steps": 25,
|
| 87 |
+
"save_every": 200,
|
| 88 |
+
"model_tag": "fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600"
|
| 89 |
+
},
|
| 90 |
+
"dataset_meta": {
|
| 91 |
+
"h5_dir": "/workspace/olmoearth/h5_shards",
|
| 92 |
+
"s2_key": "sentinel2_l2a",
|
| 93 |
+
"s1_key": "sentinel1",
|
| 94 |
+
"landsat_key": "landsat",
|
| 95 |
+
"num_timesteps": 12,
|
| 96 |
+
"timestep_strategy": "uniform",
|
| 97 |
+
"patch_size": 16,
|
| 98 |
+
"grid_size": 8,
|
| 99 |
+
"mask_ratio": 0.75,
|
| 100 |
+
"value_scales": {
|
| 101 |
+
"sentinel2_l2a": 0.0001,
|
| 102 |
+
"sentinel1": 1.0,
|
| 103 |
+
"landsat": 0.0001
|
| 104 |
+
},
|
| 105 |
+
"norm": {
|
| 106 |
+
"strategy": "computed",
|
| 107 |
+
"stats_file": "/workspace/Spatial/olmoearth_pretrain/olmoearth_pretrain/data/norm_configs/computed.json",
|
| 108 |
+
"std_multiplier": 2.0
|
| 109 |
+
},
|
| 110 |
+
"modalities": [
|
| 111 |
+
"sentinel2_l2a",
|
| 112 |
+
"sentinel1",
|
| 113 |
+
"landsat"
|
| 114 |
+
],
|
| 115 |
+
"modality_channels": {
|
| 116 |
+
"sentinel2_l2a": 12,
|
| 117 |
+
"sentinel1": 2,
|
| 118 |
+
"landsat": 11
|
| 119 |
+
},
|
| 120 |
+
"contrastive": {
|
| 121 |
+
"weight": 0.1,
|
| 122 |
+
"temp": 0.1,
|
| 123 |
+
"proj_dim": 256,
|
| 124 |
+
"queue_size": 4096,
|
| 125 |
+
"pooling": "mean_unmasked",
|
| 126 |
+
"spatial_aug": "flip_rotate",
|
| 127 |
+
"drop_s1_p": 0.3,
|
| 128 |
+
"drop_landsat_p": 0.3
|
| 129 |
+
},
|
| 130 |
+
"distill": {
|
| 131 |
+
"weight": 1.0,
|
| 132 |
+
"every": 1,
|
| 133 |
+
"teacher_patch_size": 4,
|
| 134 |
+
"teacher_expected_hw": 64,
|
| 135 |
+
"teacher_timesteps": 1,
|
| 136 |
+
"olmoearth_config": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/config.json",
|
| 137 |
+
"olmoearth_weights": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/weights.pth"
|
| 138 |
+
}
|
| 139 |
+
},
|
| 140 |
+
"grad_accum_steps": 8,
|
| 141 |
+
"dataloader_state_dict": {
|
| 142 |
+
"epoch": 1,
|
| 143 |
+
"seen_in_epoch": 10563,
|
| 144 |
+
"rank": 0
|
| 145 |
+
},
|
| 146 |
+
"loop_state": {
|
| 147 |
+
"min_val_loss": 0.0038853464648127556,
|
| 148 |
+
"smooth_train_loss": 0.6179006408300746,
|
| 149 |
+
"total_training_time": 1919.8367457389832
|
| 150 |
+
}
|
| 151 |
+
}
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/meta_000800.json
ADDED
|
@@ -0,0 +1,151 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"step": 800,
|
| 3 |
+
"model_type": "fm_vit",
|
| 4 |
+
"model_config": {
|
| 5 |
+
"embed_dim": 768,
|
| 6 |
+
"depth": 12,
|
| 7 |
+
"num_heads": 12,
|
| 8 |
+
"mlp_ratio": 4.0,
|
| 9 |
+
"dropout": 0.0,
|
| 10 |
+
"attn_dropout": 0.0,
|
| 11 |
+
"patch_size": 16,
|
| 12 |
+
"modalities": [
|
| 13 |
+
"sentinel2_l2a",
|
| 14 |
+
"sentinel1",
|
| 15 |
+
"landsat"
|
| 16 |
+
],
|
| 17 |
+
"modality_channels": {
|
| 18 |
+
"sentinel2_l2a": 12,
|
| 19 |
+
"sentinel1": 2,
|
| 20 |
+
"landsat": 11
|
| 21 |
+
}
|
| 22 |
+
},
|
| 23 |
+
"user_config": {
|
| 24 |
+
"h5_dir": "/workspace/olmoearth/h5_shards",
|
| 25 |
+
"s2_key": "sentinel2_l2a",
|
| 26 |
+
"s1_key": "sentinel1",
|
| 27 |
+
"landsat_key": "landsat",
|
| 28 |
+
"num_timesteps": 12,
|
| 29 |
+
"timestep_strategy": "uniform",
|
| 30 |
+
"patch_size": 16,
|
| 31 |
+
"mask_ratio": 0.75,
|
| 32 |
+
"s2_value_scale": 0.0001,
|
| 33 |
+
"s1_value_scale": 1.0,
|
| 34 |
+
"landsat_value_scale": 0.0001,
|
| 35 |
+
"norm": "computed",
|
| 36 |
+
"norm_stats_file": "",
|
| 37 |
+
"norm_std_multiplier": 2.0,
|
| 38 |
+
"num_workers": 32,
|
| 39 |
+
"prefetch": 64,
|
| 40 |
+
"shuffle_buffer": 2000,
|
| 41 |
+
"depth": 12,
|
| 42 |
+
"embed_dim": 768,
|
| 43 |
+
"num_heads": 12,
|
| 44 |
+
"mlp_ratio": 4.0,
|
| 45 |
+
"dropout": 0.0,
|
| 46 |
+
"attn_dropout": 0.0,
|
| 47 |
+
"contrastive_weight": 0.1,
|
| 48 |
+
"contrastive_temp": 0.1,
|
| 49 |
+
"contrastive_proj_dim": 256,
|
| 50 |
+
"contrastive_lr": 0.001,
|
| 51 |
+
"contrastive_queue_size": 4096,
|
| 52 |
+
"contrastive_pooling": "mean_unmasked",
|
| 53 |
+
"spatial_aug": "flip_rotate",
|
| 54 |
+
"drop_s1_p": 0.3,
|
| 55 |
+
"drop_landsat_p": 0.3,
|
| 56 |
+
"distill_weight": 1.0,
|
| 57 |
+
"distill_every": 1,
|
| 58 |
+
"distill_teacher_patch_size": 4,
|
| 59 |
+
"distill_teacher_expected_hw": 64,
|
| 60 |
+
"distill_teacher_timesteps": 1,
|
| 61 |
+
"distill_olmoearth_src_dir": "/workspace/Spatial/olmoearth_pretrain",
|
| 62 |
+
"distill_olmoearth_config": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/config.json",
|
| 63 |
+
"distill_olmoearth_weights": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/weights.pth",
|
| 64 |
+
"run": "dummy",
|
| 65 |
+
"device_type": "",
|
| 66 |
+
"num_iterations": 2000,
|
| 67 |
+
"device_batch_size": 2,
|
| 68 |
+
"grad_accum_steps": 8,
|
| 69 |
+
"lr": 0.0001,
|
| 70 |
+
"weight_decay": 0.05,
|
| 71 |
+
"adam_beta1": 0.9,
|
| 72 |
+
"adam_beta2": 0.95,
|
| 73 |
+
"warmup_ratio": 0.01,
|
| 74 |
+
"warmdown_ratio": 0.4,
|
| 75 |
+
"final_lr_frac": 0.0,
|
| 76 |
+
"grad_clip": 1.0,
|
| 77 |
+
"resume_from_step": 200,
|
| 78 |
+
"init_from_model_tag": "",
|
| 79 |
+
"init_from_step": -1,
|
| 80 |
+
"init_from_model_path": "",
|
| 81 |
+
"init_nonstrict": false,
|
| 82 |
+
"freeze_blocks": false,
|
| 83 |
+
"freeze_final_norm": false,
|
| 84 |
+
"freeze_recon_head": false,
|
| 85 |
+
"eval_every": 200,
|
| 86 |
+
"eval_steps": 25,
|
| 87 |
+
"save_every": 200,
|
| 88 |
+
"model_tag": "fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600"
|
| 89 |
+
},
|
| 90 |
+
"dataset_meta": {
|
| 91 |
+
"h5_dir": "/workspace/olmoearth/h5_shards",
|
| 92 |
+
"s2_key": "sentinel2_l2a",
|
| 93 |
+
"s1_key": "sentinel1",
|
| 94 |
+
"landsat_key": "landsat",
|
| 95 |
+
"num_timesteps": 12,
|
| 96 |
+
"timestep_strategy": "uniform",
|
| 97 |
+
"patch_size": 16,
|
| 98 |
+
"grid_size": 8,
|
| 99 |
+
"mask_ratio": 0.75,
|
| 100 |
+
"value_scales": {
|
| 101 |
+
"sentinel2_l2a": 0.0001,
|
| 102 |
+
"sentinel1": 1.0,
|
| 103 |
+
"landsat": 0.0001
|
| 104 |
+
},
|
| 105 |
+
"norm": {
|
| 106 |
+
"strategy": "computed",
|
| 107 |
+
"stats_file": "/workspace/Spatial/olmoearth_pretrain/olmoearth_pretrain/data/norm_configs/computed.json",
|
| 108 |
+
"std_multiplier": 2.0
|
| 109 |
+
},
|
| 110 |
+
"modalities": [
|
| 111 |
+
"sentinel2_l2a",
|
| 112 |
+
"sentinel1",
|
| 113 |
+
"landsat"
|
| 114 |
+
],
|
| 115 |
+
"modality_channels": {
|
| 116 |
+
"sentinel2_l2a": 12,
|
| 117 |
+
"sentinel1": 2,
|
| 118 |
+
"landsat": 11
|
| 119 |
+
},
|
| 120 |
+
"contrastive": {
|
| 121 |
+
"weight": 0.1,
|
| 122 |
+
"temp": 0.1,
|
| 123 |
+
"proj_dim": 256,
|
| 124 |
+
"queue_size": 4096,
|
| 125 |
+
"pooling": "mean_unmasked",
|
| 126 |
+
"spatial_aug": "flip_rotate",
|
| 127 |
+
"drop_s1_p": 0.3,
|
| 128 |
+
"drop_landsat_p": 0.3
|
| 129 |
+
},
|
| 130 |
+
"distill": {
|
| 131 |
+
"weight": 1.0,
|
| 132 |
+
"every": 1,
|
| 133 |
+
"teacher_patch_size": 4,
|
| 134 |
+
"teacher_expected_hw": 64,
|
| 135 |
+
"teacher_timesteps": 1,
|
| 136 |
+
"olmoearth_config": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/config.json",
|
| 137 |
+
"olmoearth_weights": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/weights.pth"
|
| 138 |
+
}
|
| 139 |
+
},
|
| 140 |
+
"grad_accum_steps": 8,
|
| 141 |
+
"dataloader_state_dict": {
|
| 142 |
+
"epoch": 1,
|
| 143 |
+
"seen_in_epoch": 14021,
|
| 144 |
+
"rank": 0
|
| 145 |
+
},
|
| 146 |
+
"loop_state": {
|
| 147 |
+
"min_val_loss": 0.0038853464648127556,
|
| 148 |
+
"smooth_train_loss": 0.6381232904570697,
|
| 149 |
+
"total_training_time": 2826.1666457653046
|
| 150 |
+
}
|
| 151 |
+
}
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/meta_001000.json
ADDED
|
@@ -0,0 +1,151 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"step": 1000,
|
| 3 |
+
"model_type": "fm_vit",
|
| 4 |
+
"model_config": {
|
| 5 |
+
"embed_dim": 768,
|
| 6 |
+
"depth": 12,
|
| 7 |
+
"num_heads": 12,
|
| 8 |
+
"mlp_ratio": 4.0,
|
| 9 |
+
"dropout": 0.0,
|
| 10 |
+
"attn_dropout": 0.0,
|
| 11 |
+
"patch_size": 16,
|
| 12 |
+
"modalities": [
|
| 13 |
+
"sentinel2_l2a",
|
| 14 |
+
"sentinel1",
|
| 15 |
+
"landsat"
|
| 16 |
+
],
|
| 17 |
+
"modality_channels": {
|
| 18 |
+
"sentinel2_l2a": 12,
|
| 19 |
+
"sentinel1": 2,
|
| 20 |
+
"landsat": 11
|
| 21 |
+
}
|
| 22 |
+
},
|
| 23 |
+
"user_config": {
|
| 24 |
+
"h5_dir": "/workspace/olmoearth/h5_shards",
|
| 25 |
+
"s2_key": "sentinel2_l2a",
|
| 26 |
+
"s1_key": "sentinel1",
|
| 27 |
+
"landsat_key": "landsat",
|
| 28 |
+
"num_timesteps": 12,
|
| 29 |
+
"timestep_strategy": "uniform",
|
| 30 |
+
"patch_size": 16,
|
| 31 |
+
"mask_ratio": 0.75,
|
| 32 |
+
"s2_value_scale": 0.0001,
|
| 33 |
+
"s1_value_scale": 1.0,
|
| 34 |
+
"landsat_value_scale": 0.0001,
|
| 35 |
+
"norm": "computed",
|
| 36 |
+
"norm_stats_file": "",
|
| 37 |
+
"norm_std_multiplier": 2.0,
|
| 38 |
+
"num_workers": 32,
|
| 39 |
+
"prefetch": 64,
|
| 40 |
+
"shuffle_buffer": 2000,
|
| 41 |
+
"depth": 12,
|
| 42 |
+
"embed_dim": 768,
|
| 43 |
+
"num_heads": 12,
|
| 44 |
+
"mlp_ratio": 4.0,
|
| 45 |
+
"dropout": 0.0,
|
| 46 |
+
"attn_dropout": 0.0,
|
| 47 |
+
"contrastive_weight": 0.1,
|
| 48 |
+
"contrastive_temp": 0.1,
|
| 49 |
+
"contrastive_proj_dim": 256,
|
| 50 |
+
"contrastive_lr": 0.001,
|
| 51 |
+
"contrastive_queue_size": 4096,
|
| 52 |
+
"contrastive_pooling": "mean_unmasked",
|
| 53 |
+
"spatial_aug": "flip_rotate",
|
| 54 |
+
"drop_s1_p": 0.3,
|
| 55 |
+
"drop_landsat_p": 0.3,
|
| 56 |
+
"distill_weight": 1.0,
|
| 57 |
+
"distill_every": 1,
|
| 58 |
+
"distill_teacher_patch_size": 4,
|
| 59 |
+
"distill_teacher_expected_hw": 64,
|
| 60 |
+
"distill_teacher_timesteps": 1,
|
| 61 |
+
"distill_olmoearth_src_dir": "/workspace/Spatial/olmoearth_pretrain",
|
| 62 |
+
"distill_olmoearth_config": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/config.json",
|
| 63 |
+
"distill_olmoearth_weights": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/weights.pth",
|
| 64 |
+
"run": "dummy",
|
| 65 |
+
"device_type": "",
|
| 66 |
+
"num_iterations": 2000,
|
| 67 |
+
"device_batch_size": 2,
|
| 68 |
+
"grad_accum_steps": 8,
|
| 69 |
+
"lr": 0.0001,
|
| 70 |
+
"weight_decay": 0.05,
|
| 71 |
+
"adam_beta1": 0.9,
|
| 72 |
+
"adam_beta2": 0.95,
|
| 73 |
+
"warmup_ratio": 0.01,
|
| 74 |
+
"warmdown_ratio": 0.4,
|
| 75 |
+
"final_lr_frac": 0.0,
|
| 76 |
+
"grad_clip": 1.0,
|
| 77 |
+
"resume_from_step": 200,
|
| 78 |
+
"init_from_model_tag": "",
|
| 79 |
+
"init_from_step": -1,
|
| 80 |
+
"init_from_model_path": "",
|
| 81 |
+
"init_nonstrict": false,
|
| 82 |
+
"freeze_blocks": false,
|
| 83 |
+
"freeze_final_norm": false,
|
| 84 |
+
"freeze_recon_head": false,
|
| 85 |
+
"eval_every": 200,
|
| 86 |
+
"eval_steps": 25,
|
| 87 |
+
"save_every": 200,
|
| 88 |
+
"model_tag": "fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600"
|
| 89 |
+
},
|
| 90 |
+
"dataset_meta": {
|
| 91 |
+
"h5_dir": "/workspace/olmoearth/h5_shards",
|
| 92 |
+
"s2_key": "sentinel2_l2a",
|
| 93 |
+
"s1_key": "sentinel1",
|
| 94 |
+
"landsat_key": "landsat",
|
| 95 |
+
"num_timesteps": 12,
|
| 96 |
+
"timestep_strategy": "uniform",
|
| 97 |
+
"patch_size": 16,
|
| 98 |
+
"grid_size": 8,
|
| 99 |
+
"mask_ratio": 0.75,
|
| 100 |
+
"value_scales": {
|
| 101 |
+
"sentinel2_l2a": 0.0001,
|
| 102 |
+
"sentinel1": 1.0,
|
| 103 |
+
"landsat": 0.0001
|
| 104 |
+
},
|
| 105 |
+
"norm": {
|
| 106 |
+
"strategy": "computed",
|
| 107 |
+
"stats_file": "/workspace/Spatial/olmoearth_pretrain/olmoearth_pretrain/data/norm_configs/computed.json",
|
| 108 |
+
"std_multiplier": 2.0
|
| 109 |
+
},
|
| 110 |
+
"modalities": [
|
| 111 |
+
"sentinel2_l2a",
|
| 112 |
+
"sentinel1",
|
| 113 |
+
"landsat"
|
| 114 |
+
],
|
| 115 |
+
"modality_channels": {
|
| 116 |
+
"sentinel2_l2a": 12,
|
| 117 |
+
"sentinel1": 2,
|
| 118 |
+
"landsat": 11
|
| 119 |
+
},
|
| 120 |
+
"contrastive": {
|
| 121 |
+
"weight": 0.1,
|
| 122 |
+
"temp": 0.1,
|
| 123 |
+
"proj_dim": 256,
|
| 124 |
+
"queue_size": 4096,
|
| 125 |
+
"pooling": "mean_unmasked",
|
| 126 |
+
"spatial_aug": "flip_rotate",
|
| 127 |
+
"drop_s1_p": 0.3,
|
| 128 |
+
"drop_landsat_p": 0.3
|
| 129 |
+
},
|
| 130 |
+
"distill": {
|
| 131 |
+
"weight": 1.0,
|
| 132 |
+
"every": 1,
|
| 133 |
+
"teacher_patch_size": 4,
|
| 134 |
+
"teacher_expected_hw": 64,
|
| 135 |
+
"teacher_timesteps": 1,
|
| 136 |
+
"olmoearth_config": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/config.json",
|
| 137 |
+
"olmoearth_weights": "/workspace/Spatial/nanochat_artifacts/teachers/olmoearth_v1_large/weights.pth"
|
| 138 |
+
}
|
| 139 |
+
},
|
| 140 |
+
"grad_accum_steps": 8,
|
| 141 |
+
"dataloader_state_dict": {
|
| 142 |
+
"epoch": 1,
|
| 143 |
+
"seen_in_epoch": 17492,
|
| 144 |
+
"rank": 0
|
| 145 |
+
},
|
| 146 |
+
"loop_state": {
|
| 147 |
+
"min_val_loss": 0.0038853464648127556,
|
| 148 |
+
"smooth_train_loss": 0.6192801710915687,
|
| 149 |
+
"total_training_time": 3731.589139699936
|
| 150 |
+
}
|
| 151 |
+
}
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/model_000200.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6d87441ab6868defc06c58ccd5262adccd52d76ba9d3bb1793c7c52238b4db87
|
| 3 |
+
size 606639149
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/model_000400.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23b78e71c80c0108e6d4b9c638065bd7b60d03a85c88fbe399b517174afd0df6
|
| 3 |
+
size 606639149
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/model_000600.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7376e69ad4de8eb6a7e4c3483066ebc5a0f348699110e980ac4b67a27634eefa
|
| 3 |
+
size 606639149
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/model_000800.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8b384b1cf52d8d8b27b76bc66d5775e684524bb3a86d191aa860bfa0780abd0c
|
| 3 |
+
size 606639149
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/model_001000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5e6f14e39243e82ba708b2a1ff146cf97ea2646bcccff3d5f283af28ac99185a
|
| 3 |
+
size 606639149
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000200_rank0.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ac3a40498b771a7abbba3fa744584b21fa804d31328d466bfc9440444a92c32
|
| 3 |
+
size 1215416583
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000200_rank1.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ad2ff60ba3db865d3ce5417cac821baa0daf54a924cb617cbad7566f06726bd8
|
| 3 |
+
size 1215416583
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000200_rank2.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:da426b7dc0abdd7173fff13ddae369dfdca908ff4917bc62dafa5dc61eecb281
|
| 3 |
+
size 1215416583
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000200_rank3.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:317e661fab992267b485b3394c80eeba47ffccab6c6acab54be5276778701438
|
| 3 |
+
size 1215416583
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000200_rank4.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b43bd0557a417d82c7f2628adf2293143603d95ea895e53d5882fee0e9a7e6e5
|
| 3 |
+
size 1215416583
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000200_rank5.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:51940e8955cedf709c25323ee6375541cfa223f11a656848f225c77f26514f39
|
| 3 |
+
size 1215416583
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000200_rank6.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:36b6391f839335ac4e43fa464cb95cd59145e12743a53969d0d17eab9960e6f6
|
| 3 |
+
size 1215416583
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000200_rank7.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ecf3aead879f1b5201e72fbc1b02b05f5c66957b6276f8be1a12816a2aa55924
|
| 3 |
+
size 1215416583
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000400_rank0.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4b95dc81a798c7885e412f82e5142cb78ca5ecb2e16946c1579604c8caef671e
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000400_rank1.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0686dba9c86316347abc0a1582732b06530f94971d2e54d447ddc62c25d5404b
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000400_rank2.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d23049336844dca290144dbc02b5c7de712c9e62bc2bbab71c7c1dfe771f310c
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000400_rank3.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d8e4d5938e1b117974517850df9d8ea8ade57f6e2b1b3891b71227b1cc6880fd
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000400_rank4.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f23d6ae5367dcfe6178aa1484bd60a69fa4bcfac6782874e0786009f0f1791b1
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000400_rank5.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d76ac5e48d8340b011e966b844af5f2b60a8283f08a4ebb47d8dc657eff11813
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000400_rank6.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cfde9d1285163c01413d3294542be593400427642d1a7b8d1cff7b320ea547bf
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000400_rank7.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f7ad0ab3dc046a1f9451b007cc1347786834b3c298bbde44aaeeb81cb487aeb
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000600_rank0.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2d6442918198a86968bd539d0850d58893ba2281dd1239f14fa0cfb69b1922c2
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000600_rank1.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ec27580dd1377cb965dc12d72931a6fc74bb35f792bdece63ad6718181767fa
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000600_rank2.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f4cd9757040b5348d3767fb08a15f89b18d319949ec1c0f9de48131d5c12c4d2
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000600_rank3.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4833d7622a8ed9f3225aeadb425807e25f9a4d6a545fb1fde9a37b4c7b660c65
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000600_rank4.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af42121dfeb505e46801f746f6a7a34f7b686c750b31d9127e2501bf8d282522
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000600_rank5.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dbeeed92114be0c43019e17a4caaeda4cf31c08fe8a6c133675033c71ec3c1c1
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000600_rank6.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:32903b2e47c2eb24292b125dc85e6a6680c4caf125f29dc070f2a758875e5226
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000600_rank7.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:adedeeb6afd87ef13c2d77f073c5e4352b5dc55c7c5302d45f803323f2557bf4
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000800_rank0.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:97bd9da90cf51217ec3ffa3a4a8a787db6c2fafa07278c169a2e830b80ebfc3b
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000800_rank1.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ef91178743897c6f1d41bceae6dd6e065cdecbdfd0eef827bb0fc1ecaf80c6d4
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000800_rank2.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9b0af289e3ececd96d97293d75e785c32397e80b078e187f3ba9138abcfa66b8
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000800_rank3.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:420a4c17fb181e7904d5fa82d63f8ec938a3d1bba80aec9ef45b476cbff4b4d5
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000800_rank4.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d7e7c17cf75474fd8b1fa1cbad491a1af122ac486c1755a933a4875344a8867d
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000800_rank5.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:08bc0f15393a916d0864f5e6e014ba456e679a3fec54a606a2275ad375f302c1
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000800_rank6.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b654740c98b25ce21878119d7c08acda2e0c5659ea9733ed0cb9515dc76073e2
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_000800_rank7.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:60ebfaea500e8288a9b0df0c7d459661f7f2bab9ebe6f7f460d40e10afb862e7
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_001000_rank0.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:13e13e2ffc505bd79993bd3bb5b94bb15851df1c007fba832a88ba03d6563dd4
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_001000_rank1.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cd27c98e03ad3eb4fbd2ab1843535dc3b4042f2d324151885f32dbe94c5aaa19
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_001000_rank2.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2e667ac7d754528f5882587a9e907e68c0d322295bc9ed14b90eb11b0ef97cee
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_001000_rank3.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c8053f5f5b90ec12044a91e08a17fc22cb0e0fe4acf5df21174e41ab350aad78
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_001000_rank4.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e74cc9b57b6123db83d87bbf965f5e3fe6dc3eb39a2fad8089ddc7dbb95f918c
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_001000_rank5.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5f02a04fe45ada359c95101b2bc16f6f9d77793d9f14ad752eaf2ef813402d5
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_001000_rank6.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:deb403fd0a1369860273bda7fde8de5371110f86c0329751f5e4c94f5943d95f
|
| 3 |
+
size 1215420871
|
fm_checkpoints/fmvit_d12_e768_ps16_normcomputed_contrast_oeLarge_from2600/optim_001000_rank7.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:031dee9917fc3d5d343f9cea9e8098b604edaaeaf1d1b86c431f00ef55e027db
|
| 3 |
+
size 1215420871
|