SystemAdmin123 commited on
Commit
f5d693e
·
verified ·
1 Parent(s): eefac5f

Training in progress, step 180, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:057b49db93b4bb11e49863668fa73539c65d76cca34601fff825c1691bb64851
3
  size 2471645608
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c2c0a790064775147df67e3ddcfd62e11584f5aea3f1a9de0417622cbf9c7d4
3
  size 2471645608
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d304751a2ea1c94cc1b9b0de681233ea14fc47a301587cfdabe4ca3c3d0e44bc
3
  size 2510806010
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06e4829f9e6629891612b81adb97f878de5fd94c2d2fe978b940f5f80ac0f305
3
  size 2510806010
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:56b323eece943c8be03268f2f2cd0f5781052da6f4d6e81974e7dc0391e6f9b0
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5de519c5e2e0ec73ae4a10a32ec71c2d0d5d3982d1fbb16434177a93460b8139
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8a5396b6ce82a1fa517dfb220ab4ae7fd088b5d9659632b81104386db9d3bac
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e120a86fc85c4349ce6a6d226cf9080af7941a4f32f9239b536f491d778e55d1
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:507e713485c774580f6a9da657c78542ed7cbfe40136e2096ef127927ec8b96e
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:420919d56d937c6944ec2c4a3a5402e03840612d53e7914b441877be496558d6
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac3c203718bd461046b02f6c1bbd4eca077b667406a41352c7b69bf3764ca88c
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fbf96f9883e64cb2ab53f35f353ba99bb51455ec52fb6e4f630fe95a589598d
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91ab173e3ec81f1fcc90a5bec767634b3731350aacc0be314a1243781b9ad361
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f30eaafe84a25fe4a9dc5723bc034c2757e284325f5eef16f6d75d1c5a09576
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 9.411764705882353,
5
  "eval_steps": 20,
6
- "global_step": 160,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -191,6 +191,28 @@
191
  "eval_samples_per_second": 96.468,
192
  "eval_steps_per_second": 2.249,
193
  "step": 160
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
194
  }
195
  ],
196
  "logging_steps": 10,
@@ -210,7 +232,7 @@
210
  "attributes": {}
211
  }
212
  },
213
- "total_flos": 8.344306217648128e+16,
214
  "train_batch_size": 11,
215
  "trial_name": null,
216
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 10.588235294117647,
5
  "eval_steps": 20,
6
+ "global_step": 180,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
191
  "eval_samples_per_second": 96.468,
192
  "eval_steps_per_second": 2.249,
193
  "step": 160
194
+ },
195
+ {
196
+ "epoch": 10.0,
197
+ "grad_norm": 0.62109375,
198
+ "learning_rate": 0.00013246994692046836,
199
+ "loss": 0.0373,
200
+ "step": 170
201
+ },
202
+ {
203
+ "epoch": 10.588235294117647,
204
+ "grad_norm": 0.349609375,
205
+ "learning_rate": 0.00012454854871407994,
206
+ "loss": 0.0152,
207
+ "step": 180
208
+ },
209
+ {
210
+ "epoch": 10.588235294117647,
211
+ "eval_loss": 3.9090092182159424,
212
+ "eval_runtime": 15.4377,
213
+ "eval_samples_per_second": 97.23,
214
+ "eval_steps_per_second": 2.267,
215
+ "step": 180
216
  }
217
  ],
218
  "logging_steps": 10,
 
232
  "attributes": {}
233
  }
234
  },
235
+ "total_flos": 9.389437170692915e+16,
236
  "train_batch_size": 11,
237
  "trial_name": null,
238
  "trial_params": null