BayesTensor committed on
Commit
f0d4d04
·
verified ·
1 Parent(s): b69aa7c

Training in progress, epoch 17, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd4ebc19581170d4e3e2289f89a6b6b5d0f29626415fdc205ee019874c846d0d
3
  size 598439784
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34a34dbc85953b1cdb0bbdaeaaa03b802543a05a24f2a310fb563e061abb91e3
3
  size 598439784
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d8ac87d06385767c09b376f483d886f26b33863219332f0831983eb51aff3b09
3
  size 1196967418
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d512c13bd93229b894e041a4d4fbf657700c4467bba68b92fa186e623ee6417
3
  size 1196967418
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:913ac14e71df2a85f158bf8200b2600b5f905ccb544ef3db6dcd4313366367a9
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b32902f8553b01c87284a6114f412e32aef4bacd0c7545b1d42159c57be6ff4b
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f2c831d2844bae6e5dfcbb7cfa2b1a0346a9004d27558539b670e94dfda48813
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c19e7df21c0f0cd8077c7593f632ab8849023b3e4e1c28f2e05b1b3ded8bfeb
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.8181082820112143,
3
  "best_model_checkpoint": "modernbert-medical-classifier/checkpoint-1196",
4
- "epoch": 16.0,
5
  "eval_steps": 500,
6
- "global_step": 1472,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -249,6 +249,22 @@
249
  "eval_samples_per_second": 12.694,
250
  "eval_steps_per_second": 3.174,
251
  "step": 1472
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
252
  }
253
  ],
254
  "logging_steps": 100,
@@ -268,7 +284,7 @@
268
  "attributes": {}
269
  }
270
  },
271
- "total_flos": 1.0105599870912e+16,
272
  "train_batch_size": 4,
273
  "trial_name": null,
274
  "trial_params": null
 
1
  {
2
  "best_metric": 0.8181082820112143,
3
  "best_model_checkpoint": "modernbert-medical-classifier/checkpoint-1196",
4
+ "epoch": 17.0,
5
  "eval_steps": 500,
6
+ "global_step": 1564,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
249
  "eval_samples_per_second": 12.694,
250
  "eval_steps_per_second": 3.174,
251
  "step": 1472
252
+ },
253
+ {
254
+ "epoch": 16.304347826086957,
255
+ "grad_norm": 0.004443590063601732,
256
+ "learning_rate": 1.739130434782609e-05,
257
+ "loss": 0.0764,
258
+ "step": 1500
259
+ },
260
+ {
261
+ "epoch": 17.0,
262
+ "eval_f1": 0.7634584417193113,
263
+ "eval_loss": 1.5010850429534912,
264
+ "eval_runtime": 7.2861,
265
+ "eval_samples_per_second": 12.627,
266
+ "eval_steps_per_second": 3.157,
267
+ "step": 1564
268
  }
269
  ],
270
  "logging_steps": 100,
 
284
  "attributes": {}
285
  }
286
  },
287
+ "total_flos": 1.0737199862844e+16,
288
  "train_batch_size": 4,
289
  "trial_name": null,
290
  "trial_params": null