Training in progress, step 2000

Files changed (8) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1e28797711c55f11393f39c4578ae5b2f8cae0b19bb836d6715c9d6208a82c12
 size 880446181

 version https://git-lfs.github.com/spec/v1
+oid sha256:720bfba664490a8f2978b90979bca9a5988d9147c93a193a44e284fbb4921d3f
 size 880446181

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a3f1e893c085069c4b611253e12a40c8bc225aa028961c76af0064dbc5f9d526
 size 440235825

 version https://git-lfs.github.com/spec/v1
+oid sha256:1f3f8b5a9bc2011e7a17493450859f999dce5f00a17fb64c0dbf008775c474de
 size 440235825

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:83b5038fdf82168cf2fca5379cccaf30b16bd7c6f54f8cbb9850e2c41bdd8634
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:379cbeb5d54805b5fa9714b2986e68e902f40f6fb18b1f30a7f2c91094c1eeb2
 size 14503

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9f225808d1fd8a2007ec116088248fd1e0fa6c9b4dcc13ad68eabc9e83d0e121
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:6141491e8bc35b45ecb10755fc870a0a9e5029d0796ad3f7838f1e51aa233036
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.15621745469693815,
-  "global_step": 1500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -54,11 +54,27 @@
       "eval_samples_per_second": 92.389,
       "eval_steps_per_second": 11.551,
       "step": 1500
     }
   ],
   "max_steps": 28806,
   "num_train_epochs": 3,
-  "total_flos": 3135561080832000.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.20828993959591752,
+  "global_step": 2000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 92.389,
       "eval_steps_per_second": 11.551,
       "step": 1500
+    },
+    {
+      "epoch": 0.21,
+      "learning_rate": 2.7917100604040825e-05,
+      "loss": 0.9479,
+      "step": 2000
+    },
+    {
+      "epoch": 0.21,
+      "eval_exact_match": 57.21613632411754,
+      "eval_f1": 61.625922292628005,
+      "eval_loss": 0.7944296002388,
+      "eval_runtime": 153.833,
+      "eval_samples_per_second": 92.34,
+      "eval_steps_per_second": 11.545,
+      "step": 2000
     }
   ],
   "max_steps": 28806,
   "num_train_epochs": 3,
+  "total_flos": 4180748107776000.0,
   "trial_name": null,
   "trial_params": null
 }

nbest_predictions.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

predictions.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a3f1e893c085069c4b611253e12a40c8bc225aa028961c76af0064dbc5f9d526
 size 440235825

 version https://git-lfs.github.com/spec/v1
+oid sha256:1f3f8b5a9bc2011e7a17493450859f999dce5f00a17fb64c0dbf008775c474de
 size 440235825