Training in progress, step 4000

Files changed (8) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:633117411df249b67810ce444bf3fb43946a8cd66899354347e95f320178ff8d
 size 880446181

 version https://git-lfs.github.com/spec/v1
+oid sha256:0dbdc000392478004ae6d96779bf4278d1ef18251780930b9f3c799384f5bbf7
 size 880446181

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:89123e2ca1e8f73e8549d0b72898b6506a9d8cab0ca3f0ddf2851992906d3212
 size 440235825

 version https://git-lfs.github.com/spec/v1
+oid sha256:542d1e98b1496a58397fda14504ca6f3da4a82106acb16e6eafe2d17041fd830
 size 440235825

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a8af43f49c567fc21216a636a0b928ad3f2b478713872cde9fab7fd2e5b3bd94
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:2a051295dd5bb8f79e33c3a2c94c1992b07d17d0b91ccf5450842b8cded54f3c
 size 14503

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:52671e748af9f02c099fe74fa17abb19dd5557da6aa5f91f903c19df101db345
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:d93f82e70bcd6a3d62cba6e3e991ff9feff4305521c6596bf00d78e8721b10d1
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.36450739429285567,
-  "global_step": 3500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -118,11 +118,27 @@
       "eval_samples_per_second": 91.822,
       "eval_steps_per_second": 11.48,
       "step": 3500
     }
   ],
   "max_steps": 28806,
   "num_train_epochs": 3,
-  "total_flos": 7316309188608000.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.41657987919183503,
+  "global_step": 4000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 91.822,
       "eval_steps_per_second": 11.48,
       "step": 3500
+    },
+    {
+      "epoch": 0.42,
+      "learning_rate": 2.583420120808165e-05,
+      "loss": 0.8454,
+      "step": 4000
+    },
+    {
+      "epoch": 0.42,
+      "eval_exact_match": 65.8320292123109,
+      "eval_f1": 70.26703931597173,
+      "eval_loss": 0.6987438201904297,
+      "eval_runtime": 154.6403,
+      "eval_samples_per_second": 91.858,
+      "eval_steps_per_second": 11.485,
+      "step": 4000
     }
   ],
   "max_steps": 28806,
   "num_train_epochs": 3,
+  "total_flos": 8361496215552000.0,
   "trial_name": null,
   "trial_params": null
 }

nbest_predictions.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

predictions.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:89123e2ca1e8f73e8549d0b72898b6506a9d8cab0ca3f0ddf2851992906d3212
 size 440235825

 version https://git-lfs.github.com/spec/v1
+oid sha256:542d1e98b1496a58397fda14504ca6f3da4a82106acb16e6eafe2d17041fd830
 size 440235825