Training in progress, step 810000

Browse files

Files changed (13) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +123 -3
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3a28142d72c1a639c002962982eef85320960aec72ba5875c70ba183bc4428b1
 size 893441093

 version https://git-lfs.github.com/spec/v1
+oid sha256:c4d687ddbdb4e89fc2dcf4a1194021793a9bf6bf7cb019db9f4960ca46caec57
 size 893441093

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ce05dc3d2487d7ae9aa6b0c59ea7f4616a5a7c54ca64071fd6c540348ab08786
 size 449450757

 version https://git-lfs.github.com/spec/v1
+oid sha256:7ec87ec32fe6f1afb99642886552d48e3abf86b7380d88757c48489a6974eadf
 size 449450757

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:81c65759179a0409080d1617c50ff7701ce92dbb64fc3e317b9b62050537c3c7
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:e09a2f5687d865e3c781f2165eefcb1856cc3c45b89b03d8a7d88cfa59107bfb
 size 14583

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:44a3c67c522ab27350032a90eb3d95a3dabd1324000cbd2835b62067512227df
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:acb039c0d2f72216fce3d8d73be28207294bda5cfc4474547820110b11abd2a8
 size 14583

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9d08d861261452452fd94fae84216cedf28f7702bcc30b7c349d5fe92376b24f
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:5adc671b102c788828dd37ee1d0f0b0a03c77bb3d279f123bf2cbe3d6d5cd23e
 size 14583

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:68acbc45c81b60f69d2a54d496b38309d0cdcd82a52bd9be2a013dfa91b5b790
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:8116bccf5ca568ceb54edc4c2f036f266c94ac035ff894ed751446d6238c146f
 size 14583

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f7bd01ddf08fc5e563abc90c1bcd231f2103e9ae4cae190ae9888d8dbb7258d1
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:4decc89420866c9caffa620eb043d2f83ba7fe11eee6e3e9db617a680a5e3419
 size 14583

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:294721238c7a8c697c0dc55ae3f4c4580f7fc2de42c41858980ea55e897cb68b
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:f3ecec9a0f4bcccdee7615b55d893bdd755c9846b4db2c967eb5630e87ff3741
 size 14583

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a269e37b31e512e59995e2d8559babba1725032fdbd7ed2e8cd2d1c9cdf42315
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:f7819877f3abe602d4d64d7ac8cdc0b37ac08d27db902f3ca861703ead38253c
 size 14583

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5ada5eca471a55afc26d1f38512d1163ebd3e62514e19a602711641b70fa1cc7
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:c95826cc93c68dd743486cd9578bd00eeec47504d8a825d434c0d8b522697126
 size 14583

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bc1b9455cfc1cc0d89898dcc5885e6586d120f989c1d84c4e74dce29a1aeae31
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:311a816d2396f8ee752cab7a1a3a8667609453373ab7e8b0474b724f8acc447d
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.1395078164236574,
-  "global_step": 800000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -9606,11 +9606,131 @@
       "learning_rate": 2.476016434225246e-05,
       "loss": 0.2901,
       "step": 800000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 2,
-  "total_flos": 5.4085624444111735e+22,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.1594375044841798,
+  "global_step": 810000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 2.476016434225246e-05,
       "loss": 0.2901,
       "step": 800000
+    },
+    {
+      "epoch": 1.14,
+      "learning_rate": 2.4689149133701672e-05,
+      "loss": 0.2905,
+      "step": 800500
+    },
+    {
+      "epoch": 1.14,
+      "learning_rate": 2.461828514290513e-05,
+      "loss": 0.2898,
+      "step": 801000
+    },
+    {
+      "epoch": 1.14,
+      "learning_rate": 2.4547572563602267e-05,
+      "loss": 0.2903,
+      "step": 801500
+    },
+    {
+      "epoch": 1.14,
+      "learning_rate": 2.447701158911855e-05,
+      "loss": 0.2898,
+      "step": 802000
+    },
+    {
+      "epoch": 1.14,
+      "learning_rate": 2.4406602412365027e-05,
+      "loss": 0.2898,
+      "step": 802500
+    },
+    {
+      "epoch": 1.15,
+      "learning_rate": 2.4336345225837658e-05,
+      "loss": 0.2902,
+      "step": 803000
+    },
+    {
+      "epoch": 1.15,
+      "learning_rate": 2.4266240221616956e-05,
+      "loss": 0.2905,
+      "step": 803500
+    },
+    {
+      "epoch": 1.15,
+      "learning_rate": 2.4196287591367296e-05,
+      "loss": 0.2897,
+      "step": 804000
+    },
+    {
+      "epoch": 1.15,
+      "learning_rate": 2.412648752633649e-05,
+      "loss": 0.2898,
+      "step": 804500
+    },
+    {
+      "epoch": 1.15,
+      "learning_rate": 2.405684021735527e-05,
+      "loss": 0.2898,
+      "step": 805000
+    },
+    {
+      "epoch": 1.15,
+      "learning_rate": 2.39873458548367e-05,
+      "loss": 0.2895,
+      "step": 805500
+    },
+    {
+      "epoch": 1.15,
+      "learning_rate": 2.3918004628775736e-05,
+      "loss": 0.2897,
+      "step": 806000
+    },
+    {
+      "epoch": 1.15,
+      "learning_rate": 2.3848816728748643e-05,
+      "loss": 0.2897,
+      "step": 806500
+    },
+    {
+      "epoch": 1.15,
+      "learning_rate": 2.3779782343912463e-05,
+      "loss": 0.2888,
+      "step": 807000
+    },
+    {
+      "epoch": 1.15,
+      "learning_rate": 2.3710901663004604e-05,
+      "loss": 0.29,
+      "step": 807500
+    },
+    {
+      "epoch": 1.16,
+      "learning_rate": 2.364217487434221e-05,
+      "loss": 0.2895,
+      "step": 808000
+    },
+    {
+      "epoch": 1.16,
+      "learning_rate": 2.3573602165821668e-05,
+      "loss": 0.2899,
+      "step": 808500
+    },
+    {
+      "epoch": 1.16,
+      "learning_rate": 2.3505183724918196e-05,
+      "loss": 0.2897,
+      "step": 809000
+    },
+    {
+      "epoch": 1.16,
+      "learning_rate": 2.3436919738685132e-05,
+      "loss": 0.29,
+      "step": 809500
+    },
+    {
+      "epoch": 1.16,
+      "learning_rate": 2.3368810393753687e-05,
+      "loss": 0.2895,
+      "step": 810000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 2,
+  "total_flos": 5.476171643101538e+22,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ce05dc3d2487d7ae9aa6b0c59ea7f4616a5a7c54ca64071fd6c540348ab08786
 size 449450757

 version https://git-lfs.github.com/spec/v1
+oid sha256:7ec87ec32fe6f1afb99642886552d48e3abf86b7380d88757c48489a6974eadf
 size 449450757