Training in progress, step 1000, checkpoint

Files changed (4) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c29fe4a0133197cda139441a6bba43ba30a0a16566dcea0b7516ede214fd5573
 size 161533160

 version https://git-lfs.github.com/spec/v1
+oid sha256:027c28cbacad0920c7a8ec1a4dbaf396f0658e37d9c57aa24903513cf568bf29
 size 161533160

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c5b38eb68908f60759797c8127974582cae417043d2969c2c60105311ef3ecf1
 size 323292202

 version https://git-lfs.github.com/spec/v1
+oid sha256:a811f08d635f9fd429d0ac8672eee899607dd871ece10f326b8ec3e7266d9db2
 size 323292202

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d3492512c1ba7e98d86dc7e3d6cf87a55ddfe936908da4ab0ab28461f25075b9
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:824d4a418ca52dbceab02ca3bdda11d00d54b246084fd87a75671a28233a0cb2
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -2,9 +2,9 @@
   "best_global_step": null,
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.1490066225165563,
   "eval_steps": 100,
-  "global_step": 900,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -150,6 +150,20 @@
       "learning_rate": 4.961368653421634e-05,
       "loss": 0.7661,
       "step": 900
     }
   ],
   "logging_steps": 50,
@@ -169,7 +183,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 7039716814749696.0,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

   "best_global_step": null,
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.16556291390728478,
   "eval_steps": 100,
+  "global_step": 1000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 4.961368653421634e-05,
       "loss": 0.7661,
       "step": 900
+    },
+    {
+      "epoch": 0.15728476821192053,
+      "grad_norm": 2.3362715244293213,
+      "learning_rate": 5.237306843267108e-05,
+      "loss": 0.736,
+      "step": 950
+    },
+    {
+      "epoch": 0.16556291390728478,
+      "grad_norm": 1.8228410482406616,
+      "learning_rate": 5.513245033112583e-05,
+      "loss": 0.7213,
+      "step": 1000
     }
   ],
   "logging_steps": 50,
       "attributes": {}
     }
   },
+  "total_flos": 7833052747137024.0,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null