Training in progress, step 610000

Browse files

Files changed (13) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +123 -3
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3011d318834eca8ab53dbb6676157bffa205e38d5b1da950aa905371e910e8ab
 size 893441093

 version https://git-lfs.github.com/spec/v1
+oid sha256:34fa3fbc162567eded2c54001cc8f21167119645a7ad5d9438d4d6580d7e0aaf
 size 893441093

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dd1db57f69735f18b491ceac5dcc53e66fc033f8278840d48a2d1d7789a922a3
 size 449450757

 version https://git-lfs.github.com/spec/v1
+oid sha256:eb7fc5d60355a8dfd752019852cdb15ae9d272ab89ceb9fe9acfccaaa3393cce
 size 449450757

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6d5ef830797817d960f06c7d56a345ac3affb87d9629b56b5bc8c9c3338bb01c
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:bd344a2f09d330c943a3dd3d04668fe450de22ee225e64c890f4722c7155791f
 size 14583

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:53e8adf2ea40b3fc922a7d11d4e61b79f1bf2e372d1d097107cce4c6dc566b51
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:7587b2027544c125ad8875c396124abeaa8b26e560f514a758d79f5c77d1245e
 size 14583

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:198286929a9142846ad67730b33946ccbc3ba475f115c3a0aef90b3b51ce6035
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:b98e6e4730ae83aa0bbaf43b6a70f2dbea908df991dba53b4ba6b61ef5a4bc51
 size 14583

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:03eebf4a4ea0cd9321666974d21bc38214f697b5e4b4b439941abd6a346b886d
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:3fae6c192050786077eb0c3ad856996ecc90d4abf868828c40917e34e278ddf8
 size 14583

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b03692cd1ad26b8eef58c8c71c41233d4ef014e517e327f8e4798a79a3642d38
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:04edc224f8d5fe4b319f5145ba3be953f45d1403c8d037fe0f2d7e1df55860c5
 size 14583

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4840589ea9729ad2c28a92a929b64277e6de332cdd873f9187cab513a624b326
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:6fd673ae46299e38ec0092baeee3dfcef9b18e2fdce8cd906ed6e5311b6eb2f0
 size 14583

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b1d4e4a138e230b3265d7fc7f258a4846b3b6af6bce4e94e22abcfe742c12213
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:ba46334d5cfb098826b8bc46bdfd08caddd05dd0a2ad976845aaf16ed9488107
 size 14583

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d7cc50ebf91016fa727fad392dd121c0404733da11c9da06aed7a47a81b65900
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:071dfcafc848e779fb2959117671810686f513947ddff515a5f53d88a149a7ef
 size 14583

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b1317449e5c457cd18ac6087cac07774393562aa747fda3bc1ae1eb6a47f1311
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:1451fdba239492a726627053577a5d97726556e48bcec30f5b94d6df5305247b
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.1994290717618414,
-  "global_step": 600000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -7206,11 +7206,131 @@
       "learning_rate": 6.281601590014407e-05,
       "loss": 0.3039,
       "step": 600000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 2,
-  "total_flos": 4.056420774973463e+22,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.2194195562912054,
+  "global_step": 610000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 6.281601590014407e-05,
       "loss": 0.3039,
       "step": 600000
+    },
+    {
+      "epoch": 1.2,
+      "learning_rate": 6.270383825577923e-05,
+      "loss": 0.3039,
+      "step": 600500
+    },
+    {
+      "epoch": 1.2,
+      "learning_rate": 6.259170789846017e-05,
+      "loss": 0.3034,
+      "step": 601000
+    },
+    {
+      "epoch": 1.2,
+      "learning_rate": 6.247962513474697e-05,
+      "loss": 0.3039,
+      "step": 601500
+    },
+    {
+      "epoch": 1.2,
+      "learning_rate": 6.236759027106965e-05,
+      "loss": 0.3035,
+      "step": 602000
+    },
+    {
+      "epoch": 1.2,
+      "learning_rate": 6.225560361372722e-05,
+      "loss": 0.3034,
+      "step": 602500
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 6.214366546888694e-05,
+      "loss": 0.3045,
+      "step": 603000
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 6.203177614258345e-05,
+      "loss": 0.3031,
+      "step": 603500
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 6.191993594071785e-05,
+      "loss": 0.3039,
+      "step": 604000
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 6.180814516905701e-05,
+      "loss": 0.3068,
+      "step": 604500
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 6.169640413323262e-05,
+      "loss": 0.3035,
+      "step": 605000
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 6.158471313874041e-05,
+      "loss": 0.3027,
+      "step": 605500
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 6.147307249093929e-05,
+      "loss": 0.3039,
+      "step": 606000
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 6.136148249505053e-05,
+      "loss": 0.3037,
+      "step": 606500
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 6.124994345615693e-05,
+      "loss": 0.3034,
+      "step": 607000
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 6.113845567920194e-05,
+      "loss": 0.3033,
+      "step": 607500
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 6.102701946898891e-05,
+      "loss": 0.3041,
+      "step": 608000
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 6.0915635130180154e-05,
+      "loss": 0.3027,
+      "step": 608500
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 6.0804302967296225e-05,
+      "loss": 0.3028,
+      "step": 609000
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 6.0693023284715e-05,
+      "loss": 0.3031,
+      "step": 609500
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 6.058179638667089e-05,
+      "loss": 0.3027,
+      "step": 610000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 2,
+  "total_flos": 4.124028700869167e+22,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dd1db57f69735f18b491ceac5dcc53e66fc033f8278840d48a2d1d7789a922a3
 size 449450757

 version https://git-lfs.github.com/spec/v1
+oid sha256:eb7fc5d60355a8dfd752019852cdb15ae9d272ab89ceb9fe9acfccaaa3393cce
 size 449450757