Training in progress, step 45000

Browse files

Files changed (9) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +63 -3
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:48ef65f375b5e59f1f5749f9b5d92b6593185c721625528eb784cce2ed02d68c
 size 202193937

 version https://git-lfs.github.com/spec/v1
+oid sha256:246faa74bee80665f358d5669008a0887cddb7b18e016fafe9dd7ea6316dd50e
 size 202193937

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:65ddc0e4c8f4296ecd3c8937865a6a205702a67b3f399c44945e74c8eb7117ab
 size 102501541

 version https://git-lfs.github.com/spec/v1
+oid sha256:84e97a922c2788b9920a24141a5e48a7999f9bc8c2eff341a1e699714ef37106
 size 102501541

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0e78893dd4244a47b1f0ec82be35592851bdbef7f0a2077ad84f084e71bbb0dc
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:46dd8d4a8076e5a459a085df9fe23a5e0b6a3ba2a8db83be1492ad01e7ed9159
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0e78893dd4244a47b1f0ec82be35592851bdbef7f0a2077ad84f084e71bbb0dc
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:46dd8d4a8076e5a459a085df9fe23a5e0b6a3ba2a8db83be1492ad01e7ed9159
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0e78893dd4244a47b1f0ec82be35592851bdbef7f0a2077ad84f084e71bbb0dc
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:46dd8d4a8076e5a459a085df9fe23a5e0b6a3ba2a8db83be1492ad01e7ed9159
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0e78893dd4244a47b1f0ec82be35592851bdbef7f0a2077ad84f084e71bbb0dc
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:46dd8d4a8076e5a459a085df9fe23a5e0b6a3ba2a8db83be1492ad01e7ed9159
 size 14503

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c97de0675cb6398d3c3d756355dca4463427408f54efe4c22a7193c161dbf261
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:3b42368e9f62da349b2760579f9deddc87fbe7062743f1048a9d6bf6e1d86f64
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.6127685649726169,
-  "global_step": 40000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -486,11 +486,71 @@
       "learning_rate": 1.4975414512725056e-05,
       "loss": 0.0519,
       "step": 40000
     }
   ],
   "max_steps": 500000,
   "num_train_epochs": 8,
-  "total_flos": 6.38974277549e+20,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.689364635594194,
+  "global_step": 45000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.4975414512725056e-05,
       "loss": 0.0519,
       "step": 40000
+    },
+    {
+      "epoch": 0.62,
+      "learning_rate": 1.4973749622593532e-05,
+      "loss": 0.0518,
+      "step": 40500
+    },
+    {
+      "epoch": 0.63,
+      "learning_rate": 1.4972030340333e-05,
+      "loss": 0.0517,
+      "step": 41000
+    },
+    {
+      "epoch": 0.64,
+      "learning_rate": 1.4970256684745257e-05,
+      "loss": 0.0516,
+      "step": 41500
+    },
+    {
+      "epoch": 0.64,
+      "learning_rate": 1.4968428675226714e-05,
+      "loss": 0.0516,
+      "step": 42000
+    },
+    {
+      "epoch": 0.65,
+      "learning_rate": 1.4966546331768191e-05,
+      "loss": 0.0515,
+      "step": 42500
+    },
+    {
+      "epoch": 0.66,
+      "learning_rate": 1.4964609674954694e-05,
+      "loss": 0.0514,
+      "step": 43000
+    },
+    {
+      "epoch": 0.67,
+      "learning_rate": 1.4962618725965194e-05,
+      "loss": 0.0512,
+      "step": 43500
+    },
+    {
+      "epoch": 0.67,
+      "learning_rate": 1.496057350657239e-05,
+      "loss": 0.051,
+      "step": 44000
+    },
+    {
+      "epoch": 0.68,
+      "learning_rate": 1.4958474039142468e-05,
+      "loss": 0.0509,
+      "step": 44500
+    },
+    {
+      "epoch": 0.69,
+      "learning_rate": 1.4956320346634877e-05,
+      "loss": 0.0507,
+      "step": 45000
     }
   ],
   "max_steps": 500000,
   "num_train_epochs": 8,
+  "total_flos": 7.18846062242625e+20,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:65ddc0e4c8f4296ecd3c8937865a6a205702a67b3f399c44945e74c8eb7117ab
 size 102501541

 version https://git-lfs.github.com/spec/v1
+oid sha256:84e97a922c2788b9920a24141a5e48a7999f9bc8c2eff341a1e699714ef37106
 size 102501541