Training in progress, epoch 10, checkpoint

Files changed (5) hide show

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8557197285aa474040732b3faf52393778ccfe00bf2845374700a5667bdcd056
 size 2239622772

 version https://git-lfs.github.com/spec/v1
+oid sha256:600761be52ca5f8db7b1334e95cc98070d6a77518b8aef9e2d41a06a93813d47
 size 2239622772

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c5e59aaa067c95b6cfddb464e72f58685323c6ab29970b47228c7420a4a065fc
 size 4479480977

 version https://git-lfs.github.com/spec/v1
+oid sha256:e48bb9dc117514bc0dd0c5074802d86ef6e9b63d3a18daa3fc6203097bf99ad7
 size 4479480977

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cec783a1bdc155c6d7712fc7ca4a10a43873c934e423ff7ca10b82cc4bb429b4
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:0dd7a61559d056ff5d2702c0055be5ae53afa45081a941a0da65d1e175fc5c8d
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:68b8fc6c968c09b32ebacd5345c995f5b98e128622b1e398ff34fccb1711fb5a
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:0c8e0f1f62b73393c8041520b56b5aed263e50a6773914fd4a6c488106230884
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": 0.7774524158125915,
   "best_model_checkpoint": "modelParams/TrainingArguments_output\\checkpoint-796",
-  "epoch": 9.0,
   "eval_steps": 500,
-  "global_step": 1791,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -109,6 +109,15 @@
       "eval_samples_per_second": 12.032,
       "eval_steps_per_second": 6.016,
       "step": 1791
     }
   ],
   "logging_steps": 500,
@@ -123,12 +132,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 2.660119696008864e+16,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": 0.7774524158125915,
   "best_model_checkpoint": "modelParams/TrainingArguments_output\\checkpoint-796",
+  "epoch": 10.0,
   "eval_steps": 500,
+  "global_step": 1990,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 12.032,
       "eval_steps_per_second": 6.016,
       "step": 1791
+    },
+    {
+      "epoch": 10.0,
+      "eval_accuracy": 0.7679355783308931,
+      "eval_loss": 1.8216043710708618,
+      "eval_runtime": 170.3389,
+      "eval_samples_per_second": 8.019,
+      "eval_steps_per_second": 4.01,
+      "step": 1990
     }
   ],
   "logging_steps": 500,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 2.95568855112096e+16,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null