Training in progress, step 6468

Files changed (6) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2001a2a8d146bbc3210e2ba74909a6c54a34bc0f57ecb371f3a4fdf527c02b9d
 size 133863493

 version https://git-lfs.github.com/spec/v1
+oid sha256:3cd9ed599b2622be6183702891ab47ac5b9f5406d312cb802b16ed7f3098d9cf
 size 133863493

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1faeff0083195d9b234e601d177b81e0e8b95814a0bfb980ed3d9c20fa193536
 size 266276525

 version https://git-lfs.github.com/spec/v1
+oid sha256:7f92d3d52cf47be1987752bc89ccb1ec1c6e0dc8b68b55de2fed88e49ded0e92
 size 266276525

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fa0b772b5dd21989336ffb42562e16185bc2e1d10a7ccdcb65ed21eb3e033e8e
 size 14511

 version https://git-lfs.github.com/spec/v1
+oid sha256:edec1b2f1f61c07d3b95c625533890e74aa6568913f1c7d51a65585f79b1d35e
 size 14511

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:874b5d38d8e13a97c857fe192fe23456e3dd1f5254d9ee7767049f04c81795a2
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:2c3ed672465d4250f40b2ef2e23b0eb90ec6136a6bc9ed10c02bf3f9c750c79e
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.4500835034329189,
-  "global_step": 4851,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -60,11 +60,29 @@
       "learning_rate": 2.195833505288551e-05,
       "loss": 0.1404,
       "step": 4500
     }
   ],
   "max_steps": 32334,
   "num_train_epochs": 3,
-  "total_flos": 8.225711749398528e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.6001113379105586,
+  "global_step": 6468,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 2.195833505288551e-05,
       "loss": 0.1404,
       "step": 4500
+    },
+    {
+      "epoch": 0.46,
+      "learning_rate": 2.156388339209501e-05,
+      "loss": 0.1381,
+      "step": 5000
+    },
+    {
+      "epoch": 0.51,
+      "learning_rate": 2.116943173130451e-05,
+      "loss": 0.136,
+      "step": 5500
+    },
+    {
+      "epoch": 0.56,
+      "learning_rate": 2.077498007051401e-05,
+      "loss": 0.135,
+      "step": 6000
     }
   ],
   "max_steps": 32334,
   "num_train_epochs": 3,
+  "total_flos": 1.0967615665864704e+17,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1faeff0083195d9b234e601d177b81e0e8b95814a0bfb980ed3d9c20fa193536
 size 266276525

 version https://git-lfs.github.com/spec/v1
+oid sha256:7f92d3d52cf47be1987752bc89ccb1ec1c6e0dc8b68b55de2fed88e49ded0e92
 size 266276525