Training in progress, step 840000

Browse files

Files changed (13) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +123 -3
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ef1b487cabfa82f2f81ded5cef2d529a41a97f8137d750d66e05d443478e91a
 size 893441093

 version https://git-lfs.github.com/spec/v1
+oid sha256:b2f81c933b26cfeb60d53ba82d975294e2c7358973e2715677db9ca7fd31945d
 size 893441093

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b63e12b39341c1c8d25b10dc8ca07cde5e82303726c5b23ac1fdd24345f08c2a
 size 449450757

 version https://git-lfs.github.com/spec/v1
+oid sha256:80793dabaaad0486a9c6c7d32363ba477ae4d785ddabb640496bf016359dc491
 size 449450757

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:34241c46169d6140a8feca7f2e1db99ea6d7326e000406064ac61feecf3f17b2
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:c09ff3d1788e565e5a086e252ccf0ede212b045e4e5f4392a44c6ea6f0987dd6
 size 14583

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9fb4767c32ae0f5cf34a94816a959b9568b2ea2174c179de2a3df992017a5f77
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:e058e2238a38cee98eacc9109fd883ace95c4833f253ace4bd37e2704c0fe5af
 size 14583

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:efc0c6d968c43ae24dfc91f94bcca80995b7ed16b92115235f58d28e636291a4
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:9431567146b6a803c38f6863bbd8c9115e688967dc8f725b32605962fde389b3
 size 14583

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:df72b23925eb5f82752cd028feed8cf7d2bbe1dbdf011029efc7554632b26ae2
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:65f8725dca368138ac60071ebf1967a52a0bdc41ecaaff24531fe8b99b9ccb52
 size 14583

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bd1259a368e737ba331fab7b54a98c7cfc3dd87ed455bcbc28503bda235c71d3
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:2eda6d197ffa3fe6958e94125c5fa0490a4afe5ac2f8a51ad2a4931b09364f04
 size 14583

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5f2eac6df5cd35dc068eb0bab0d362a924c2221b17b5c9bfe0e42f4ba3c05c9c
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:fa3a1be70ad51e1c8a5b547f1989a2e92d51a9ec27c3a4490875ff9354ff3dda
 size 14583

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4e7f8260a2f4cc917f2e6b69683488cb603bdd620504afe136b5dc796247fcec
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:8bc51de7c0af3e5027c4a852a232459cf39ee9a71ea51b7603a1f5327ee5a020
 size 14583

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:41a93612851ee52955512369b8723183837a90f2506b353970cd64de58829b3d
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:e4a63b1c76ff6ed1a203a2dff4664ff326fc59ea9cbb507ef4f3897d7810fb84
 size 14583

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5bde979dd08e67682f748b136bdd4f7c962a7cebec495023e183c816b6c75933
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:90777e10c619a178822dbd35785dbd74396ff21ef94c6855b7e97b44a2c700b9
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.1992968806052247,
-  "global_step": 830000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -9966,11 +9966,131 @@
       "learning_rate": 2.0773332330534513e-05,
       "loss": 0.2887,
       "step": 830000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 2,
-  "total_flos": 5.6113757283593115e+22,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.2192265686657473,
+  "global_step": 840000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 2.0773332330534513e-05,
       "loss": 0.2887,
       "step": 830000
+    },
+    {
+      "epoch": 1.2,
+      "learning_rate": 2.0711718689098057e-05,
+      "loss": 0.2886,
+      "step": 830500
+    },
+    {
+      "epoch": 1.2,
+      "learning_rate": 2.0650267139558772e-05,
+      "loss": 0.2887,
+      "step": 831000
+    },
+    {
+      "epoch": 1.2,
+      "learning_rate": 2.058897784992289e-05,
+      "loss": 0.2885,
+      "step": 831500
+    },
+    {
+      "epoch": 1.2,
+      "learning_rate": 2.052785098775293e-05,
+      "loss": 0.2886,
+      "step": 832000
+    },
+    {
+      "epoch": 1.2,
+      "learning_rate": 2.0466886720167436e-05,
+      "loss": 0.2877,
+      "step": 832500
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 2.04060852138404e-05,
+      "loss": 0.2878,
+      "step": 833000
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 2.0345446635000783e-05,
+      "loss": 0.2887,
+      "step": 833500
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 2.028497114943219e-05,
+      "loss": 0.2888,
+      "step": 834000
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 2.022465892247223e-05,
+      "loss": 0.2881,
+      "step": 834500
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 2.0164510119012263e-05,
+      "loss": 0.2878,
+      "step": 835000
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 2.0104524903496834e-05,
+      "loss": 0.2879,
+      "step": 835500
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 2.0044703439923217e-05,
+      "loss": 0.2876,
+      "step": 836000
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 1.998504589184101e-05,
+      "loss": 0.2879,
+      "step": 836500
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 1.9925552422351654e-05,
+      "loss": 0.2878,
+      "step": 837000
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 1.9866223194108028e-05,
+      "loss": 0.2884,
+      "step": 837500
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 1.9807058369314016e-05,
+      "loss": 0.288,
+      "step": 838000
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 1.9748058109723953e-05,
+      "loss": 0.2879,
+      "step": 838500
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 1.968922257664231e-05,
+      "loss": 0.2878,
+      "step": 839000
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 1.9630551930923155e-05,
+      "loss": 0.288,
+      "step": 839500
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 1.9572046332969825e-05,
+      "loss": 0.2881,
+      "step": 840000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 2,
+  "total_flos": 5.678984079326211e+22,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b63e12b39341c1c8d25b10dc8ca07cde5e82303726c5b23ac1fdd24345f08c2a
 size 449450757

 version https://git-lfs.github.com/spec/v1
+oid sha256:80793dabaaad0486a9c6c7d32363ba477ae4d785ddabb640496bf016359dc491
 size 449450757