Training in progress, step 820000

Browse files

Files changed (13) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +123 -3
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c4d687ddbdb4e89fc2dcf4a1194021793a9bf6bf7cb019db9f4960ca46caec57
 size 893441093

 version https://git-lfs.github.com/spec/v1
+oid sha256:fb7fd5efb2ff87d094795926832b73ee7aa1e6614b8bfcc85208c1fac61c542d
 size 893441093

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7ec87ec32fe6f1afb99642886552d48e3abf86b7380d88757c48489a6974eadf
 size 449450757

 version https://git-lfs.github.com/spec/v1
+oid sha256:3dd2e6a7da537ff760743918bcaefe9c986fc2c76a2e5c7636f4801ac5b5cd7b
 size 449450757

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e09a2f5687d865e3c781f2165eefcb1856cc3c45b89b03d8a7d88cfa59107bfb
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:0609e713a668aa906084c6d7021e86eb2ccb60af4342d1b4397b833b19fbbc89
 size 14583

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:acb039c0d2f72216fce3d8d73be28207294bda5cfc4474547820110b11abd2a8
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:3592882666e2655598af900b2cb26f9f1ba0f86a99376f61e0440aabceaa6a07
 size 14583

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5adc671b102c788828dd37ee1d0f0b0a03c77bb3d279f123bf2cbe3d6d5cd23e
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:1ca8c6c74101f99bae3f401fe7213e04d3ffd2cde1efe24238143ecf20918b53
 size 14583

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8116bccf5ca568ceb54edc4c2f036f266c94ac035ff894ed751446d6238c146f
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:8a67149e6f2c803c5510419511ac904f9537eb4fbff5066e666ed08b44f9664f
 size 14583

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4decc89420866c9caffa620eb043d2f83ba7fe11eee6e3e9db617a680a5e3419
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:6e59f03ce343bc2279a4caef20772b97445f7cad5f56f03c6fe562ef9297aba5
 size 14583

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f3ecec9a0f4bcccdee7615b55d893bdd755c9846b4db2c967eb5630e87ff3741
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:49b75ef2c8e55abd504706b58ef3e0a8e29500c910d22cedece78b4bbdd0c43a
 size 14583

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f7819877f3abe602d4d64d7ac8cdc0b37ac08d27db902f3ca861703ead38253c
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:6a3e48ab19d013994e76ce74871eebcf792a7f0de0b1bc5e31a34b55c3911660
 size 14583

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c95826cc93c68dd743486cd9578bd00eeec47504d8a825d434c0d8b522697126
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:83f313ad3307a61df4799cc55bebfd321f79a2d67e43e4af68c3ea5f2e8a2721
 size 14583

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:311a816d2396f8ee752cab7a1a3a8667609453373ab7e8b0474b724f8acc447d
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:735207f6708877a90cb07d7ba5bda4e331561a0f2cd24f0dff22c21fa9a1d464
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.1594375044841798,
-  "global_step": 810000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -9726,11 +9726,131 @@
       "learning_rate": 2.3368810393753687e-05,
       "loss": 0.2895,
       "step": 810000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 2,
-  "total_flos": 5.476171643101538e+22,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.1793671925447022,
+  "global_step": 820000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 2.3368810393753687e-05,
       "loss": 0.2895,
       "step": 810000
+    },
+    {
+      "epoch": 1.16,
+      "learning_rate": 2.3300855876332162e-05,
+      "loss": 0.2894,
+      "step": 810500
+    },
+    {
+      "epoch": 1.16,
+      "learning_rate": 2.32330563722056e-05,
+      "loss": 0.2896,
+      "step": 811000
+    },
+    {
+      "epoch": 1.16,
+      "learning_rate": 2.316541206673529e-05,
+      "loss": 0.2896,
+      "step": 811500
+    },
+    {
+      "epoch": 1.16,
+      "learning_rate": 2.309792314485815e-05,
+      "loss": 0.2895,
+      "step": 812000
+    },
+    {
+      "epoch": 1.16,
+      "learning_rate": 2.3030589791086353e-05,
+      "loss": 0.2893,
+      "step": 812500
+    },
+    {
+      "epoch": 1.17,
+      "learning_rate": 2.2963412189506695e-05,
+      "loss": 0.2893,
+      "step": 813000
+    },
+    {
+      "epoch": 1.17,
+      "learning_rate": 2.2896390523780156e-05,
+      "loss": 0.2894,
+      "step": 813500
+    },
+    {
+      "epoch": 1.17,
+      "learning_rate": 2.282952497714145e-05,
+      "loss": 0.2894,
+      "step": 814000
+    },
+    {
+      "epoch": 1.17,
+      "learning_rate": 2.2762815732398387e-05,
+      "loss": 0.2896,
+      "step": 814500
+    },
+    {
+      "epoch": 1.17,
+      "learning_rate": 2.2696262971931538e-05,
+      "loss": 0.2891,
+      "step": 815000
+    },
+    {
+      "epoch": 1.17,
+      "learning_rate": 2.2629866877693577e-05,
+      "loss": 0.2892,
+      "step": 815500
+    },
+    {
+      "epoch": 1.17,
+      "learning_rate": 2.2563627631208887e-05,
+      "loss": 0.2892,
+      "step": 816000
+    },
+    {
+      "epoch": 1.17,
+      "learning_rate": 2.2497545413573065e-05,
+      "loss": 0.2902,
+      "step": 816500
+    },
+    {
+      "epoch": 1.17,
+      "learning_rate": 2.2431620405452336e-05,
+      "loss": 0.2889,
+      "step": 817000
+    },
+    {
+      "epoch": 1.17,
+      "learning_rate": 2.23658527870832e-05,
+      "loss": 0.2892,
+      "step": 817500
+    },
+    {
+      "epoch": 1.18,
+      "learning_rate": 2.230024273827179e-05,
+      "loss": 0.2885,
+      "step": 818000
+    },
+    {
+      "epoch": 1.18,
+      "learning_rate": 2.223479043839345e-05,
+      "loss": 0.2888,
+      "step": 818500
+    },
+    {
+      "epoch": 1.18,
+      "learning_rate": 2.216949606639231e-05,
+      "loss": 0.2892,
+      "step": 819000
+    },
+    {
+      "epoch": 1.18,
+      "learning_rate": 2.2104359800780665e-05,
+      "loss": 0.2885,
+      "step": 819500
+    },
+    {
+      "epoch": 1.18,
+      "learning_rate": 2.2039381819638596e-05,
+      "loss": 0.2894,
+      "step": 820000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 2,
+  "total_flos": 5.543772678797676e+22,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7ec87ec32fe6f1afb99642886552d48e3abf86b7380d88757c48489a6974eadf
 size 449450757

 version https://git-lfs.github.com/spec/v1
+oid sha256:3dd2e6a7da537ff760743918bcaefe9c986fc2c76a2e5c7636f4801ac5b5cd7b
 size 449450757