Training in progress, epoch 9, checkpoint

Files changed (5) hide show

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8449c4ae7d212a97a024e7742d0eb6425352aa9e246e8e7bdc9a4e1d4a02e23e
 size 1476713628

 version https://git-lfs.github.com/spec/v1
+oid sha256:5694a7255cc1234b09e13f63a12b42d96f34e32f40a5cbc560987864b913faf4
 size 1476713628

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1870ecc5515ed63dc03a4b33b6d8d27cd2ca8a6689b9db074de7016f6dc7f61a
 size 2953659629

 version https://git-lfs.github.com/spec/v1
+oid sha256:69d3ffe768c399a428e1319e382826c8136c7462cb28bde5e99a1d8d41b10757
 size 2953659629

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4ff5818d57c272941dc6f306de2dfd7967ba52b362d6b269745887120fb80364
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:104accde398aea5178b47634f177e17064714f138801ca956369778c71ddfcaa
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9724b84ede32733f55a1e267adf046dff43ccd7ab501903c4975574b019c6b4c
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:a66bc7346a88fe9fe198bcb7770fa48175a412d9d55edf8c37c58498b9538d78
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": 0.7364568081991215,
   "best_model_checkpoint": "modelParams/TrainingArguments_output\\checkpoint-447",
-  "epoch": 8.984924623115578,
   "eval_steps": 500,
-  "global_step": 447,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -88,6 +88,15 @@
       "eval_samples_per_second": 26.42,
       "eval_steps_per_second": 3.307,
       "step": 447
     }
   ],
   "logging_steps": 500,
@@ -102,12 +111,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 2.660119696008864e+16,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": 0.7364568081991215,
   "best_model_checkpoint": "modelParams/TrainingArguments_output\\checkpoint-447",
+  "epoch": 9.849246231155778,
   "eval_steps": 500,
+  "global_step": 490,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 26.42,
       "eval_steps_per_second": 3.307,
       "step": 447
+    },
+    {
+      "epoch": 9.849246231155778,
+      "eval_accuracy": 0.7306002928257687,
+      "eval_loss": 0.6873601675033569,
+      "eval_runtime": 51.5519,
+      "eval_samples_per_second": 26.498,
+      "eval_steps_per_second": 3.317,
+      "step": 490
     }
   ],
   "logging_steps": 500,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 2.91113043225984e+16,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null