Training in progress, step 600000

Browse files

Files changed (13) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +123 -3
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4bd1f4862280bc4f9f20cf61fc91f853df59d4ca3541b026db7600611b178d50
 size 893441093

 version https://git-lfs.github.com/spec/v1
+oid sha256:3011d318834eca8ab53dbb6676157bffa205e38d5b1da950aa905371e910e8ab
 size 893441093

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6e98866b99e3ecd40c53531087e5d2e3191cf9fd862f418f5c2164fc106076e1
 size 449450757

 version https://git-lfs.github.com/spec/v1
+oid sha256:dd1db57f69735f18b491ceac5dcc53e66fc033f8278840d48a2d1d7789a922a3
 size 449450757

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ab3dcf04e4677cd69d3fbe91cb1ae1601851f3937f4fd0e788d25fd8dd5a9a5c
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:6d5ef830797817d960f06c7d56a345ac3affb87d9629b56b5bc8c9c3338bb01c
 size 14583

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6068ed85b429651ab3dcdb9d8c131e8794f545bafa654289904ead8dcf71a796
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:53e8adf2ea40b3fc922a7d11d4e61b79f1bf2e372d1d097107cce4c6dc566b51
 size 14583

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:96d9c6af477a0b5f695c5b258b6a01aca5fc7cfa2d38303757339b849dbd7d3e
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:198286929a9142846ad67730b33946ccbc3ba475f115c3a0aef90b3b51ce6035
 size 14583

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:567a88294b09dd010f920f0bbc226b5e5f9189a07eafb2d3246224b7bdd85b03
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:03eebf4a4ea0cd9321666974d21bc38214f697b5e4b4b439941abd6a346b886d
 size 14583

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:56ebaee321096ea2774b004b42a63721b74b8260bf65ca91c67dcab0fe39ddf6
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:b03692cd1ad26b8eef58c8c71c41233d4ef014e517e327f8e4798a79a3642d38
 size 14583

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:400b8eee678f22dae7d12f6670127ef9e783a9bd2487ab20a30cddd0d1ae18fc
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:4840589ea9729ad2c28a92a929b64277e6de332cdd873f9187cab513a624b326
 size 14583

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ace2fdb32ece5ddc2b6164c2a1d1ed057e126355e32ac6d8db09bc2cd476da7
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:b1d4e4a138e230b3265d7fc7f258a4846b3b6af6bce4e94e22abcfe742c12213
 size 14583

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:90d67e927134f71d028c643f8c9e8a2e214f618d0796c97003c322009d54ac2a
 size 14583

 version https://git-lfs.github.com/spec/v1
+oid sha256:d7cc50ebf91016fa727fad392dd121c0404733da11c9da06aed7a47a81b65900
 size 14583

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4c3d2e37603fc85abdaa1469887efb3190e7c384dc663afb9c8011e46abae231
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:b1317449e5c457cd18ac6087cac07774393562aa747fda3bc1ae1eb6a47f1311
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.1794385872324773,
-  "global_step": 590000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -7086,11 +7086,131 @@
       "learning_rate": 6.506902584793773e-05,
       "loss": 0.3043,
       "step": 590000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 2,
-  "total_flos": 3.988811683155628e+22,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.1994290717618414,
+  "global_step": 600000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 6.506902584793773e-05,
       "loss": 0.3043,
       "step": 590000
+    },
+    {
+      "epoch": 1.18,
+      "learning_rate": 6.495596703323214e-05,
+      "loss": 0.3039,
+      "step": 590500
+    },
+    {
+      "epoch": 1.18,
+      "learning_rate": 6.484294934833822e-05,
+      "loss": 0.3042,
+      "step": 591000
+    },
+    {
+      "epoch": 1.18,
+      "learning_rate": 6.472997310224204e-05,
+      "loss": 0.304,
+      "step": 591500
+    },
+    {
+      "epoch": 1.18,
+      "learning_rate": 6.461703860381628e-05,
+      "loss": 0.3039,
+      "step": 592000
+    },
+    {
+      "epoch": 1.18,
+      "learning_rate": 6.450414616181959e-05,
+      "loss": 0.3041,
+      "step": 592500
+    },
+    {
+      "epoch": 1.19,
+      "learning_rate": 6.439129608489559e-05,
+      "loss": 0.3043,
+      "step": 593000
+    },
+    {
+      "epoch": 1.19,
+      "learning_rate": 6.427848868157208e-05,
+      "loss": 0.3041,
+      "step": 593500
+    },
+    {
+      "epoch": 1.19,
+      "learning_rate": 6.41657242602602e-05,
+      "loss": 0.304,
+      "step": 594000
+    },
+    {
+      "epoch": 1.19,
+      "learning_rate": 6.405300312925353e-05,
+      "loss": 0.3044,
+      "step": 594500
+    },
+    {
+      "epoch": 1.19,
+      "learning_rate": 6.39403255967274e-05,
+      "loss": 0.304,
+      "step": 595000
+    },
+    {
+      "epoch": 1.19,
+      "learning_rate": 6.382769197073783e-05,
+      "loss": 0.3042,
+      "step": 595500
+    },
+    {
+      "epoch": 1.19,
+      "learning_rate": 6.371510255922088e-05,
+      "loss": 0.3041,
+      "step": 596000
+    },
+    {
+      "epoch": 1.19,
+      "learning_rate": 6.360255766999172e-05,
+      "loss": 0.3036,
+      "step": 596500
+    },
+    {
+      "epoch": 1.19,
+      "learning_rate": 6.349005761074372e-05,
+      "loss": 0.3044,
+      "step": 597000
+    },
+    {
+      "epoch": 1.19,
+      "learning_rate": 6.33776026890478e-05,
+      "loss": 0.3038,
+      "step": 597500
+    },
+    {
+      "epoch": 1.2,
+      "learning_rate": 6.326519321235139e-05,
+      "loss": 0.3036,
+      "step": 598000
+    },
+    {
+      "epoch": 1.2,
+      "learning_rate": 6.315282948797776e-05,
+      "loss": 0.3033,
+      "step": 598500
+    },
+    {
+      "epoch": 1.2,
+      "learning_rate": 6.304051182312496e-05,
+      "loss": 0.3034,
+      "step": 599000
+    },
+    {
+      "epoch": 1.2,
+      "learning_rate": 6.292824052486525e-05,
+      "loss": 0.3036,
+      "step": 599500
+    },
+    {
+      "epoch": 1.2,
+      "learning_rate": 6.281601590014407e-05,
+      "loss": 0.3039,
+      "step": 600000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 2,
+  "total_flos": 4.056420774973463e+22,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6e98866b99e3ecd40c53531087e5d2e3191cf9fd862f418f5c2164fc106076e1
 size 449450757

 version https://git-lfs.github.com/spec/v1
+oid sha256:dd1db57f69735f18b491ceac5dcc53e66fc033f8278840d48a2d1d7789a922a3
 size 449450757