BayesTensor committed on
Commit
72ccc2c
·
verified ·
1 Parent(s): 530635e

Training in progress, epoch 2, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77bc596fba1eaefecb79510ac76ae8a790122557a720d1c3fba802366d309ad7
3
  size 598439784
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74874d52f7cbbfa76ffc7607401873f007ee833060bc619b6e5d44da8f7ca856
3
  size 598439784
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aaa31c74dffb446932954321bc66ebd6b0b5820b11f76b30c1cde8aac29e62db
3
  size 1196967418
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88dbd6c5e3d796ad17799d4c8569579663913a90fafdcf88e07c396b8a6a9b5e
3
  size 1196967418
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f2e155718eaa0de9768e57816e6e6874ba931ec4489afb1c2874db91c97f7a96
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee3528bf0ace792176d57cac1ea8e325db1e81a8856e3e8a6e53688b51f9516e
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:40f7853ae8f9bd5119e6435e73044e4eaccdadd4c58eff5131a9bb8b91736361
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29515a795f42318c0b4340751f84ea735733a1e6cda14a74cb2f0c287dead1f9
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.5993395707209687,
3
  "best_model_checkpoint": "modernbert-medical-classifier/checkpoint-92",
4
- "epoch": 1.0,
5
  "eval_steps": 500,
6
- "global_step": 92,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -16,6 +16,22 @@
16
  "eval_samples_per_second": 12.927,
17
  "eval_steps_per_second": 3.232,
18
  "step": 92
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
19
  }
20
  ],
21
  "logging_steps": 100,
@@ -35,7 +51,7 @@
35
  "attributes": {}
36
  }
37
  },
38
- "total_flos": 631599991932000.0,
39
  "train_batch_size": 4,
40
  "trial_name": null,
41
  "trial_params": null
 
1
  {
2
  "best_metric": 0.5993395707209687,
3
  "best_model_checkpoint": "modernbert-medical-classifier/checkpoint-92",
4
+ "epoch": 2.0,
5
  "eval_steps": 500,
6
+ "global_step": 184,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
16
  "eval_samples_per_second": 12.927,
17
  "eval_steps_per_second": 3.232,
18
  "step": 92
19
+ },
20
+ {
21
+ "epoch": 1.0869565217391304,
22
+ "grad_norm": 3.5607712268829346,
23
+ "learning_rate": 4.782608695652174e-05,
24
+ "loss": 0.7932,
25
+ "step": 100
26
+ },
27
+ {
28
+ "epoch": 2.0,
29
+ "eval_f1": 0.5993395707209687,
30
+ "eval_loss": 0.6113200187683105,
31
+ "eval_runtime": 7.1729,
32
+ "eval_samples_per_second": 12.826,
33
+ "eval_steps_per_second": 3.206,
34
+ "step": 184
35
  }
36
  ],
37
  "logging_steps": 100,
 
51
  "attributes": {}
52
  }
53
  },
54
+ "total_flos": 1263199983864000.0,
55
  "train_batch_size": 4,
56
  "trial_name": null,
57
  "trial_params": null