Training in progress, step 150, checkpoint

Browse files

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors +1 -1
last-checkpoint/optimizer.pt +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +63 -3

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5700e75aedd836722315a2c637c8f75ca8370d0dfa88cc4580ff8fe5a9f37fa5
 size 75012288

 version https://git-lfs.github.com/spec/v1
+oid sha256:f49598723d8c65b7f6b5645c5a07f36db4679055c387465cb717c054f54d515e
 size 75012288

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:613aa481d37097de3af43e8bfa4a424fc42d0e26cc1f8774020cfe2b5bf15281
 size 38034724

 version https://git-lfs.github.com/spec/v1
+oid sha256:85bac65930f267247f044f6c70a029246ba89f8f917fe1796bf0c7621d66d613
 size 38034724

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:54d19fc9cad9609a6172c82e6d0d91c418c97728872a9b499c73ea8cd6f52e82
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:2b8fb474d85aef0f57c5c82e36b87ff9ecbc12ff5a856d932e9b2940d26914d2
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:839736b31b97702e0c125f95929ada9032d07251504fab76843e29c8dc4d0fce
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:194456d3c9e165255d5406a0f3f62973b0bede79d91784f72431350783e27ae7
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.056,
   "eval_steps": 1000,
-  "global_step": 140,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -847,13 +847,73 @@
       "learning_rate": 1.360544217687075e-05,
       "loss": 1.9262,
       "step": 140
     }
   ],
   "logging_steps": 1,
   "max_steps": 150,
   "num_train_epochs": 1,
   "save_steps": 5,
-  "total_flos": 7515861863497728.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.06,
   "eval_steps": 1000,
+  "global_step": 150,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.360544217687075e-05,
       "loss": 1.9262,
       "step": 140
+    },
+    {
+      "epoch": 0.06,
+      "learning_rate": 1.2244897959183674e-05,
+      "loss": 1.8739,
+      "step": 141
+    },
+    {
+      "epoch": 0.06,
+      "learning_rate": 1.08843537414966e-05,
+      "loss": 1.8307,
+      "step": 142
+    },
+    {
+      "epoch": 0.06,
+      "learning_rate": 9.523809523809523e-06,
+      "loss": 1.8247,
+      "step": 143
+    },
+    {
+      "epoch": 0.06,
+      "learning_rate": 8.163265306122448e-06,
+      "loss": 1.8952,
+      "step": 144
+    },
+    {
+      "epoch": 0.06,
+      "learning_rate": 6.802721088435375e-06,
+      "loss": 1.8041,
+      "step": 145
+    },
+    {
+      "epoch": 0.06,
+      "learning_rate": 5.4421768707483e-06,
+      "loss": 1.8557,
+      "step": 146
+    },
+    {
+      "epoch": 0.06,
+      "learning_rate": 4.081632653061224e-06,
+      "loss": 1.9398,
+      "step": 147
+    },
+    {
+      "epoch": 0.06,
+      "learning_rate": 2.72108843537415e-06,
+      "loss": 1.944,
+      "step": 148
+    },
+    {
+      "epoch": 0.06,
+      "learning_rate": 1.360544217687075e-06,
+      "loss": 2.0813,
+      "step": 149
+    },
+    {
+      "epoch": 0.06,
+      "learning_rate": 0.0,
+      "loss": 1.8519,
+      "step": 150
     }
   ],
   "logging_steps": 1,
   "max_steps": 150,
   "num_train_epochs": 1,
   "save_steps": 5,
+  "total_flos": 8125557976793088.0,
   "trial_name": null,
   "trial_params": null
 }