pilotj committed on
Commit
1903ba4
·
verified ·
1 Parent(s): e9fdf72

Training in progress, step 5500, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:685d53982b27eb365dec7e10b5430fca13c6e0fa7574169dc00b5b61713d4d8e
3
  size 498686648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27b44157417e39f37d53f97660159534caa17c9e92cc0fcc65d26cdc58df41c2
3
  size 498686648
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e480ea2c1707535961a915ad7d0c076244f7d677a129489077a8242a2b9126a7
3
  size 997493050
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0a598fbe7a9896408099f5b9156dc689745bd20c4fc91ba85bea8bdd2ed788e
3
  size 997493050
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e46df96471f815a1d294c24fe73c8ab67a0d41f321e80dcd299bde46010e94cf
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c44ae4ad313b4be83c6fe4120f4de7b8df0b41f03db919b420b2e256111040f7
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e4b999bc7117f5e365eaf55ab190141de7aaca3ce426abdc3f6d80268e7bf79
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1756636f56007ccf3026f60661401a9b281d6ff9e2176d95116df6815604e882
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.46239224076271057,
3
- "best_model_checkpoint": "results/checkpoint-4500",
4
- "epoch": 0.474068455484972,
5
  "eval_steps": 500,
6
- "global_step": 5000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -207,6 +207,26 @@
207
  "eval_samples_per_second": 59.804,
208
  "eval_steps_per_second": 0.469,
209
  "step": 5000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
210
  }
211
  ],
212
  "logging_steps": 500,
@@ -226,7 +246,7 @@
226
  "attributes": {}
227
  }
228
  },
229
- "total_flos": 8.421368070144e+16,
230
  "train_batch_size": 32,
231
  "trial_name": null,
232
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.45522668957710266,
3
+ "best_model_checkpoint": "results/checkpoint-5500",
4
+ "epoch": 0.5214753010334693,
5
  "eval_steps": 500,
6
+ "global_step": 5500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
207
  "eval_samples_per_second": 59.804,
208
  "eval_steps_per_second": 0.469,
209
  "step": 5000
210
+ },
211
+ {
212
+ "epoch": 0.5214753010334693,
213
+ "grad_norm": 426242.5,
214
+ "learning_rate": 1.9140987958661234e-05,
215
+ "loss": 0.5104,
216
+ "step": 5500
217
+ },
218
+ {
219
+ "epoch": 0.5214753010334693,
220
+ "eval_accuracy": 0.868323910097659,
221
+ "eval_f1_macro": 0.8363938907947726,
222
+ "eval_f1_w": 0.8695247067175498,
223
+ "eval_loss": 0.45522668957710266,
224
+ "eval_precision": 0.8726509048119306,
225
+ "eval_recall": 0.868323910097659,
226
+ "eval_runtime": 357.8353,
227
+ "eval_samples_per_second": 59.807,
228
+ "eval_steps_per_second": 0.469,
229
+ "step": 5500
230
  }
231
  ],
232
  "logging_steps": 500,
 
246
  "attributes": {}
247
  }
248
  },
249
+ "total_flos": 9.2635048771584e+16,
250
  "train_batch_size": 32,
251
  "trial_name": null,
252
  "trial_params": null