Training in progress, epoch 8, checkpoint

Files changed (5) hide show

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ee6d0a0d1ba196c8ccf73fe46078bafa455bffb6853f62431c24e8c68ef38678
 size 283195372

 version https://git-lfs.github.com/spec/v1
+oid sha256:dffdaa18d490862a5baa34f1aa1bc200d0d828239d6937759dba871204f96647
 size 283195372

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:332d17b5e57c17ea68145eaf3eb2e4d742f697c48a07f22b9669c31a70d2c7d5
 size 566510586

 version https://git-lfs.github.com/spec/v1
+oid sha256:4058832662a554684058259749c60029406d0e939fd4f2354ba6001345e6670b
 size 566510586

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4cdbe556a15488115b67033be7756c22ee46c44dc8550421fe1e87784e89a4b3
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:0403b973607a11ec8e102f5d54893b1b4bd95322e3f79eb6b0f5e4a601f67d63
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:09e5fd8384f36863e16c6caa18ce6d31e617ce30791085f2827d0277f3f4cbca
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:97cf51aabce7093c5fba6ba591e23e2496121cbddbeffe19a8366acfe3aafef1
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": 0.34553440702781846,
   "best_model_checkpoint": "modelParams/TrainingArguments_output\\checkpoint-24",
-  "epoch": 8.0,
   "eval_steps": 500,
-  "global_step": 199,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -79,6 +79,15 @@
       "eval_samples_per_second": 139.235,
       "eval_steps_per_second": 8.766,
       "step": 199
     }
   ],
   "logging_steps": 500,
@@ -98,7 +107,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 1671445714567680.0,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": 0.34553440702781846,
   "best_model_checkpoint": "modelParams/TrainingArguments_output\\checkpoint-24",
+  "epoch": 8.964824120603016,
   "eval_steps": 500,
+  "global_step": 223,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 139.235,
       "eval_steps_per_second": 8.766,
       "step": 199
+    },
+    {
+      "epoch": 8.964824120603016,
+      "eval_accuracy": 0.4128843338213763,
+      "eval_loss": 1.072035551071167,
+      "eval_runtime": 9.4031,
+      "eval_samples_per_second": 145.27,
+      "eval_steps_per_second": 9.146,
+      "step": 223
     }
   ],
   "logging_steps": 500,
       "attributes": {}
     }
   },
+  "total_flos": 1880376428888640.0,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null