Training in progress, epoch 5, checkpoint

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bf7f1711371cdf22625cfd71373d0e13667f9262db729700ebba8bff281e302f
 size 6403448

 version https://git-lfs.github.com/spec/v1
+oid sha256:1e3dbdf3aa088737ce1cdad6ea130252698559d75de369f4db5b9d8dac0347ff
 size 6403448

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fa22af2fc608eb3be5b6d7756926317b864996be333d25aedbb9e48d2d5bd10f
 size 12867066

 version https://git-lfs.github.com/spec/v1
+oid sha256:cf90bfc28626b9b635a21b6c7af37c270a72edf31a353533fd4ccef7270c5d23
 size 12867066

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6a0a24216fd4977ce1d76fe035f83db58fced950e69f3285260aec3babc9a654
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:10e3856931a60333566c32feed9f656e65195d769bc3d7827e3d40c2fac2012a
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:492f28b6539849c91c4a713593f718b0248ba49625b6a14592a3de84ad5d56c7
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:d99598dae57d4b1975eeb0f5c3edb922a43a02c02fef0ccb682d848ccbb64cfa
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,10 +1,10 @@
 {
-  "best_global_step": 52,
-  "best_metric": 5.0411696434021,
-  "best_model_checkpoint": "My-Nietzsche-Model/checkpoint-52",
-  "epoch": 4.0,
   "eval_steps": 500,
-  "global_step": 52,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -40,6 +40,14 @@
       "eval_samples_per_second": 3.212,
       "eval_steps_per_second": 0.803,
       "step": 52
     }
   ],
   "logging_steps": 500,
@@ -54,12 +62,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 2494553191833600.0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
+  "best_global_step": 65,
+  "best_metric": 5.032853603363037,
+  "best_model_checkpoint": "My-Nietzsche-Model/checkpoint-65",
+  "epoch": 5.0,
   "eval_steps": 500,
+  "global_step": 65,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 3.212,
       "eval_steps_per_second": 0.803,
       "step": 52
+    },
+    {
+      "epoch": 5.0,
+      "eval_loss": 5.032853603363037,
+      "eval_runtime": 6.187,
+      "eval_samples_per_second": 3.233,
+      "eval_steps_per_second": 0.808,
+      "step": 65
     }
   ],
   "logging_steps": 500,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 3118191489792000.0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null