patrickamadeus committed on
Commit
eba78f6
·
verified ·
1 Parent(s): 8784b51

Upload checkpoint from unified script: step_750

Browse files
Files changed (3) hide show
  1. config.json +5 -5
  2. model.safetensors +2 -2
  3. training_state.pt +2 -2
config.json CHANGED
@@ -103,23 +103,23 @@
103
  "r8c8": "<row_8_col_8>"
104
  },
105
  "vlm_load_backbone_weights": true,
106
- "use_kv_bridge": true,
107
  "kv_bridge_mode": "identity",
108
  "kv_bridge_affine_stack_depth": 1,
109
  "kv_bridge_adapter_expansion_factor": 1.0,
110
- "kv_bridge_use_gate": true
111
  },
112
  "train_cfg": {
113
  "lr_mp": 5e-05,
114
  "lr_vision_backbone": 0.0,
115
- "lr_language_backbone": 1e-05,
116
  "lr_right_tower": 0.0,
117
- "lr_kv_bridge": 0.0001,
118
  "batch_size": 8,
119
  "gradient_accumulation_steps": 16,
120
  "max_grad_norm": 1.0,
121
  "max_training_steps": 2000,
122
- "warmup_ratio": 0.01,
123
  "stats_log_interval": 100,
124
  "compile": false,
125
  "eval_in_epochs": false,
 
103
  "r8c8": "<row_8_col_8>"
104
  },
105
  "vlm_load_backbone_weights": true,
106
+ "use_kv_bridge": false,
107
  "kv_bridge_mode": "identity",
108
  "kv_bridge_affine_stack_depth": 1,
109
  "kv_bridge_adapter_expansion_factor": 1.0,
110
+ "kv_bridge_use_gate": false
111
  },
112
  "train_cfg": {
113
  "lr_mp": 5e-05,
114
  "lr_vision_backbone": 0.0,
115
+ "lr_language_backbone": 5e-05,
116
  "lr_right_tower": 0.0,
117
+ "lr_kv_bridge": 0.0,
118
  "batch_size": 8,
119
  "gradient_accumulation_steps": 16,
120
  "max_grad_norm": 1.0,
121
  "max_training_steps": 2000,
122
+ "warmup_ratio": 0.03,
123
  "stats_log_interval": 100,
124
  "compile": false,
125
  "eval_in_epochs": false,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9ad70d5eff599c3ca1dad724a4491b6e5ccfd51126e1a8df0eaca64d59ec3de1
3
- size 1450611792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82cb2c98139194e0186b99a5f9a8b9500d87793a27f534f624129628bbf9e42f
3
+ size 1450578848
training_state.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5e4fd2e0e7b638aab2f27558b7fd21c5d8e81e77d9a0373e505e769a70d9e8fa
3
- size 1106791965
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4220fe8d71f97014d122f580ceaba6cef4c731f51549fb5ce1abc5b57f0a3638
3
+ size 1106724543