Training in progress, step 75, checkpoint

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7dc66795d94cfdc9fa0478447c0ae9a43784dec074a53df26bc2e160ef687199
 size 83945296

 version https://git-lfs.github.com/spec/v1
+oid sha256:11e42786d49cfe41cfcaa54d5091ee6e85eeaff37d1a87d017da8498e1f1156f
 size 83945296

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1f2c8a8aeae6258956ce5b950ff0aebe12996f2ab918b7a6127893b67fd0586f
 size 42545748

 version https://git-lfs.github.com/spec/v1
+oid sha256:1693edb689091d1d86be591036d1ecbf67b627bcf824db2357c4dbe37a987704
 size 42545748

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:557e474a226d303e26d6758a2eb18bb0bbe3b1a451146f9953c40e79b727f273
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:2a2343c093429d43a756778ff280bf9733e4758b7f37beec7554cba6baaf362e
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7ca1e7c31f034aff02934fb59782ccef2d42f2b76452335ba79106ad1a626b6c
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:babd43118aa66a4f5266d730539cf7f09611158b169d9e63dbcb83f6bbaa8626
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.028,
   "eval_steps": 1000,
-  "global_step": 70,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -427,13 +427,43 @@
       "learning_rate": 1.388888888888889e-05,
       "loss": 1.7016,
       "step": 70
     }
   ],
   "logging_steps": 1,
   "max_steps": 75,
   "num_train_epochs": 1,
   "save_steps": 5,
-  "total_flos": 4233108315045888.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.03,
   "eval_steps": 1000,
+  "global_step": 75,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.388888888888889e-05,
       "loss": 1.7016,
       "step": 70
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 1.1111111111111112e-05,
+      "loss": 2.2515,
+      "step": 71
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 8.333333333333334e-06,
+      "loss": 2.047,
+      "step": 72
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 5.555555555555556e-06,
+      "loss": 1.3849,
+      "step": 73
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 2.777777777777778e-06,
+      "loss": 1.4436,
+      "step": 74
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 0.0,
+      "loss": 1.6971,
+      "step": 75
     }
   ],
   "logging_steps": 1,
   "max_steps": 75,
   "num_train_epochs": 1,
   "save_steps": 5,
+  "total_flos": 4668793953730560.0,
   "trial_name": null,
   "trial_params": null
 }