Upload checkpoint from unified script: step_750
Browse files- config.json +5 -5
- model.safetensors +2 -2
- training_state.pt +2 -2
config.json
CHANGED
|
@@ -103,23 +103,23 @@
|
|
| 103 |
"r8c8": "<row_8_col_8>"
|
| 104 |
},
|
| 105 |
"vlm_load_backbone_weights": true,
|
| 106 |
-
"use_kv_bridge":
|
| 107 |
"kv_bridge_mode": "identity",
|
| 108 |
"kv_bridge_affine_stack_depth": 1,
|
| 109 |
"kv_bridge_adapter_expansion_factor": 1.0,
|
| 110 |
-
"kv_bridge_use_gate":
|
| 111 |
},
|
| 112 |
"train_cfg": {
|
| 113 |
"lr_mp": 5e-05,
|
| 114 |
"lr_vision_backbone": 0.0,
|
| 115 |
-
"lr_language_backbone":
|
| 116 |
"lr_right_tower": 0.0,
|
| 117 |
-
"lr_kv_bridge": 0.
|
| 118 |
"batch_size": 8,
|
| 119 |
"gradient_accumulation_steps": 16,
|
| 120 |
"max_grad_norm": 1.0,
|
| 121 |
"max_training_steps": 2000,
|
| 122 |
-
"warmup_ratio": 0.
|
| 123 |
"stats_log_interval": 100,
|
| 124 |
"compile": false,
|
| 125 |
"eval_in_epochs": false,
|
|
|
|
| 103 |
"r8c8": "<row_8_col_8>"
|
| 104 |
},
|
| 105 |
"vlm_load_backbone_weights": true,
|
| 106 |
+
"use_kv_bridge": false,
|
| 107 |
"kv_bridge_mode": "identity",
|
| 108 |
"kv_bridge_affine_stack_depth": 1,
|
| 109 |
"kv_bridge_adapter_expansion_factor": 1.0,
|
| 110 |
+
"kv_bridge_use_gate": false
|
| 111 |
},
|
| 112 |
"train_cfg": {
|
| 113 |
"lr_mp": 5e-05,
|
| 114 |
"lr_vision_backbone": 0.0,
|
| 115 |
+
"lr_language_backbone": 5e-05,
|
| 116 |
"lr_right_tower": 0.0,
|
| 117 |
+
"lr_kv_bridge": 0.0,
|
| 118 |
"batch_size": 8,
|
| 119 |
"gradient_accumulation_steps": 16,
|
| 120 |
"max_grad_norm": 1.0,
|
| 121 |
"max_training_steps": 2000,
|
| 122 |
+
"warmup_ratio": 0.03,
|
| 123 |
"stats_log_interval": 100,
|
| 124 |
"compile": false,
|
| 125 |
"eval_in_epochs": false,
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:82cb2c98139194e0186b99a5f9a8b9500d87793a27f534f624129628bbf9e42f
|
| 3 |
+
size 1450578848
|
training_state.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4220fe8d71f97014d122f580ceaba6cef4c731f51549fb5ce1abc5b57f0a3638
|
| 3 |
+
size 1106724543
|