nttx commited on
Commit
eed8909
·
verified ·
1 Parent(s): 4e35c2f

Training in progress, step 3000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7350d1b2818baa194908d604eef7d306d0bfda5a977b25f0ba8f3ee19c68e643
3
  size 14696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7f5f69eb370fc7cd0e87c5a48e96b6953f6920201b31709ada4329d30f011a3
3
  size 14696
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1efe7f84caa469288758d729267e555e7d4959d5bd9b77991c6b054571b2b94e
3
  size 39462
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0d79ef4e6c5113b42eee59ebe99aca1e4a398804d179d3775d21f338ac28624
3
  size 39462
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1bfd7bc146b83962f8ea49d8335d7e42b9e02cb8c55d49480bb5d6fb1f3eb70
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4aefdcd16ebb09118c94fb4a5607a3f3423d69e946dd5477422923831fb7280
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c411a66287d4fb76303ae5ba8fbc6149ecf0ea6d0ba0f17e45b450c5260043f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:822b16bddd8bcf1ca02e61cd33e647684b752a55f3a3f365bbcb33421d66a2a5
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 11.912158012390137,
3
- "best_model_checkpoint": "miner_id_24/checkpoint-2700",
4
- "epoch": 4.511792945105406,
5
  "eval_steps": 300,
6
- "global_step": 2700,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -150,6 +150,21 @@
150
  "eval_samples_per_second": 209.592,
151
  "eval_steps_per_second": 26.277,
152
  "step": 2700
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
153
  }
154
  ],
155
  "logging_steps": 300,
@@ -173,12 +188,12 @@
173
  "should_evaluate": false,
174
  "should_log": false,
175
  "should_save": true,
176
- "should_training_stop": false
177
  },
178
  "attributes": {}
179
  }
180
  },
181
- "total_flos": 5104572825600.0,
182
  "train_batch_size": 8,
183
  "trial_name": null,
184
  "trial_params": null
 
1
  {
2
+ "best_metric": 11.912154197692871,
3
+ "best_model_checkpoint": "miner_id_24/checkpoint-3000",
4
+ "epoch": 5.01356710498852,
5
  "eval_steps": 300,
6
+ "global_step": 3000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
150
  "eval_samples_per_second": 209.592,
151
  "eval_steps_per_second": 26.277,
152
  "step": 2700
153
+ },
154
+ {
155
+ "epoch": 5.01356710498852,
156
+ "grad_norm": 0.012090091593563557,
157
+ "learning_rate": 0.0,
158
+ "loss": 11.9374,
159
+ "step": 3000
160
+ },
161
+ {
162
+ "epoch": 5.01356710498852,
163
+ "eval_loss": 11.912154197692871,
164
+ "eval_runtime": 9.5524,
165
+ "eval_samples_per_second": 211.256,
166
+ "eval_steps_per_second": 26.485,
167
+ "step": 3000
168
  }
169
  ],
170
  "logging_steps": 300,
 
188
  "should_evaluate": false,
189
  "should_log": false,
190
  "should_save": true,
191
+ "should_training_stop": true
192
  },
193
  "attributes": {}
194
  }
195
  },
196
+ "total_flos": 5671747584000.0,
197
  "train_batch_size": 8,
198
  "trial_name": null,
199
  "trial_params": null