Training in progress, step 850000

Browse files

Files changed (13) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +123 -3
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b2f81c933b26cfeb60d53ba82d975294e2c7358973e2715677db9ca7fd31945d
 size 893441093

 version https://git-lfs.github.com/spec/v1
+oid sha256:2e84ef55f585409a7eb44e502edc32a6f98749bb849f76b8b16d08a3dc37d8ae
 size 893441093

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:80793dabaaad0486a9c6c7d32363ba477ae4d785ddabb640496bf016359dc491
 size 449450757

 version https://git-lfs.github.com/spec/v1
+oid sha256:4a461e16ba87e1e69720d854eafd25f8ca62064d88d546c07f46eddd6113b782
 size 449450757

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c09ff3d1788e565e5a086e252ccf0ede212b045e4e5f4392a44c6ea6f0987dd6
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:8ac44739d68ab8d92ea75cbaa95e05b08c8692ab1a77edef6cb58ac613b56151
 size 14583

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e058e2238a38cee98eacc9109fd883ace95c4833f253ace4bd37e2704c0fe5af
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:1df68ed20ea8916573dab6835f47431337c9ff47e9296153749cafb56a0237a7
 size 14583

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9431567146b6a803c38f6863bbd8c9115e688967dc8f725b32605962fde389b3
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:77f291c8b37b0aa8ca2df1a663842fb970bdeff54c0b2afea5e2500f1ec3c566
 size 14583

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:65f8725dca368138ac60071ebf1967a52a0bdc41ecaaff24531fe8b99b9ccb52
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:21eb46d9347a0d809f89248620dfe17276a72e359d7ca7fa7d35b0bd105aa105
 size 14583

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2eda6d197ffa3fe6958e94125c5fa0490a4afe5ac2f8a51ad2a4931b09364f04
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:351c206e5b3b4ed149381ec4e0dbf48f45d70d99336ae5535af82fc3c087c11c
 size 14583

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fa3a1be70ad51e1c8a5b547f1989a2e92d51a9ec27c3a4490875ff9354ff3dda
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:5aa383878cd306edcfd23540112b984f51a1f84d02ae2848e2f7b0c8c85af935
 size 14583

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8bc51de7c0af3e5027c4a852a232459cf39ee9a71ea51b7603a1f5327ee5a020
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:63948dedd46aa19ac12a8709dee2f12fa168b63bee773e75612f1919ff39b2f0
 size 14583

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e4a63b1c76ff6ed1a203a2dff4664ff326fc59ea9cbb507ef4f3897d7810fb84
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:6ec45b14f87f8f42299fc33d4fabbcc588674c41ff3399499af6ac36481288d5
 size 14583

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:90777e10c619a178822dbd35785dbd74396ff21ef94c6855b7e97b44a2c700b9
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:208c2830fa39459dcf60f5b94c27151cbc48e3dc8fdf884186b8d5be230917b9
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.2192265686657473,
-  "global_step": 840000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -10086,11 +10086,131 @@
       "learning_rate": 1.9572046332969825e-05,
       "loss": 0.2881,
       "step": 840000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 2,
-  "total_flos": 5.678984079326211e+22,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.2391562567262697,
+  "global_step": 850000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.9572046332969825e-05,
       "loss": 0.2881,
       "step": 840000
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 1.95137059427344e-05,
+      "loss": 0.2884,
+      "step": 840500
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 1.945553091971727e-05,
+      "loss": 0.2883,
+      "step": 841000
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 1.93975214229667e-05,
+      "loss": 0.2885,
+      "step": 841500
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 1.933967761107847e-05,
+      "loss": 0.2877,
+      "step": 842000
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 1.928199964219533e-05,
+      "loss": 0.2876,
+      "step": 842500
+    },
+    {
+      "epoch": 1.23,
+      "learning_rate": 1.9224487674006694e-05,
+      "loss": 0.2873,
+      "step": 843000
+    },
+    {
+      "epoch": 1.23,
+      "learning_rate": 1.9167141863748015e-05,
+      "loss": 0.288,
+      "step": 843500
+    },
+    {
+      "epoch": 1.23,
+      "learning_rate": 1.9109962368200602e-05,
+      "loss": 0.2874,
+      "step": 844000
+    },
+    {
+      "epoch": 1.23,
+      "learning_rate": 1.9052949343690977e-05,
+      "loss": 0.2884,
+      "step": 844500
+    },
+    {
+      "epoch": 1.23,
+      "learning_rate": 1.8996102946090586e-05,
+      "loss": 0.2874,
+      "step": 845000
+    },
+    {
+      "epoch": 1.23,
+      "learning_rate": 1.8939423330815345e-05,
+      "loss": 0.2879,
+      "step": 845500
+    },
+    {
+      "epoch": 1.23,
+      "learning_rate": 1.888291065282509e-05,
+      "loss": 0.2872,
+      "step": 846000
+    },
+    {
+      "epoch": 1.23,
+      "learning_rate": 1.882656506662338e-05,
+      "loss": 0.2882,
+      "step": 846500
+    },
+    {
+      "epoch": 1.23,
+      "learning_rate": 1.8770386726256865e-05,
+      "loss": 0.2875,
+      "step": 847000
+    },
+    {
+      "epoch": 1.23,
+      "learning_rate": 1.8714375785315006e-05,
+      "loss": 0.2871,
+      "step": 847500
+    },
+    {
+      "epoch": 1.24,
+      "learning_rate": 1.8658532396929565e-05,
+      "loss": 0.2872,
+      "step": 848000
+    },
+    {
+      "epoch": 1.24,
+      "learning_rate": 1.8602856713774208e-05,
+      "loss": 0.2874,
+      "step": 848500
+    },
+    {
+      "epoch": 1.24,
+      "learning_rate": 1.8547348888064178e-05,
+      "loss": 0.2869,
+      "step": 849000
+    },
+    {
+      "epoch": 1.24,
+      "learning_rate": 1.8492009071555703e-05,
+      "loss": 0.2873,
+      "step": 849500
+    },
+    {
+      "epoch": 1.24,
+      "learning_rate": 1.8436837415545772e-05,
+      "loss": 0.2874,
+      "step": 850000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 2,
+  "total_flos": 5.746589779150674e+22,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:80793dabaaad0486a9c6c7d32363ba477ae4d785ddabb640496bf016359dc491
 size 449450757

 version https://git-lfs.github.com/spec/v1
+oid sha256:4a461e16ba87e1e69720d854eafd25f8ca62064d88d546c07f46eddd6113b782
 size 449450757