Training in progress, step 500, checkpoint

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1c47212017af1d1890422725962f2f60e0630141c69c87c0f307cb0f6c9fd9a1
 size 67143296

 version https://git-lfs.github.com/spec/v1
+oid sha256:8641639f36d2017cd3be1c77d3de39c47ab3545ed6cdf0ef30eafe1db1dca62e
 size 67143296

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b8fdb34b5032791db249965fe2cb89cd69e01769c1856d0a422fea22e2d6b103
 size 33920095

 version https://git-lfs.github.com/spec/v1
+oid sha256:44e354b2b9a397b20dbba46c4d4bd8056e9c164df5588f0377d09afe9a838825
 size 33920095

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:036fe95b6a14168d369a32ce869914bf19a1cf115c749866d43c0dbc23f4fc3c
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:9ec45735acf0d21a6a13a33353b33cadb4eb3f9c802c936af55a3f5542ea95b3
 size 14575

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d5e88c363c3a1a500cd49caa98c7b1302e3233ffa1415f85f0e1a36caffee951
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:1352cee7a141eadc0dec5a54fb0352c24d3de0192e8f627a38660bb21a3c14e2
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.4390243902439024,
   "eval_steps": 100,
-  "global_step": 400,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -59,13 +59,26 @@
       "eval_samples_per_second": 2.038,
       "eval_steps_per_second": 0.266,
       "step": 400
     }
   ],
   "logging_steps": 100,
   "max_steps": 1312,
   "num_train_epochs": 8,
   "save_steps": 100,
-  "total_flos": 3.322448287314739e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 3.048780487804878,
   "eval_steps": 100,
+  "global_step": 500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 2.038,
       "eval_steps_per_second": 0.266,
       "step": 400
+    },
+    {
+      "epoch": 3.05,
+      "learning_rate": 0.0002,
+      "loss": 0.0777,
+      "step": 500
+    },
+    {
+      "epoch": 3.05,
+      "eval_runtime": 33.8767,
+      "eval_samples_per_second": 2.037,
+      "eval_steps_per_second": 0.266,
+      "step": 500
     }
   ],
   "logging_steps": 100,
   "max_steps": 1312,
   "num_train_epochs": 8,
   "save_steps": 100,
+  "total_flos": 4.151500035902669e+16,
   "trial_name": null,
   "trial_params": null
 }