Training in progress, step 4

Files changed (10) hide show

last-checkpoint/optimizer.pt +2 -2
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/tokenizer.json +0 -0
last-checkpoint/trainer_state.json +5 -120
last-checkpoint/training_args.bin +1 -1
pytorch_model.bin +1 -1
tokenizer.json +0 -0
training_args.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5eca4bd1a0dc3b2f038f66bf50388447d18eebc41526b5232e9919ecb62a5a4b
-size 532524613

 version https://git-lfs.github.com/spec/v1
+oid sha256:af5dec527a9c814f0b0b0969f34e18dce6cc7e0ca1c062900e9ab561d71c0257
+size 532524485

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:caa61399b7a53227108ebc38249705c50a8fb19b1d595bb3a5d63e8831b7d1a3
 size 266267309

 version https://git-lfs.github.com/spec/v1
+oid sha256:409dfb718254049ca6895716068c3f4df968a22517ef020c66c5c26146f3ab5f
 size 266267309

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f4b6060cf279e50135a405faf92c008144efde33dc3f94ac0484548bac6ae9e8
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:16316a0b550954c0ab10d38c11e7ce2f43ad6cbf8d106a8d9c7a3e97f8b3cf6e
 size 14575

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:eb688e14e79b4182b9e5a8155b72ea71bee611c12f2cd72cad99d48f21f81233
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:58e38e56f6ae6eafba42fa147eb9fa2dd398045bd711083ebb7e1bfe98b50fd0
 size 627

last-checkpoint/tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,130 +1,15 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.8535120147874307,
-  "global_step": 6175,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
-  "log_history": [
-    {
-      "epoch": 0.23,
-      "learning_rate": 4.614910659272951e-05,
-      "loss": 0.6968,
-      "step": 500
-    },
-    {
-      "epoch": 0.46,
-      "learning_rate": 4.2298213185459026e-05,
-      "loss": 0.6951,
-      "step": 1000
-    },
-    {
-      "epoch": 0.69,
-      "learning_rate": 3.844731977818854e-05,
-      "loss": 0.6944,
-      "step": 1500
-    },
-    {
-      "epoch": 0.92,
-      "learning_rate": 3.4596426370918056e-05,
-      "loss": 0.6944,
-      "step": 2000
-    },
-    {
-      "epoch": 0.92,
-      "eval_accuracy": {
-        "accuracy": 0.5025017869907077
-      },
-      "eval_f1": {
-        "f1": 0.0
-      },
-      "eval_loss": 0.6932790279388428,
-      "eval_runtime": 11.9399,
-      "eval_samples_per_second": 234.341,
-      "eval_steps_per_second": 1.843,
-      "step": 2000
-    },
-    {
-      "epoch": 1.16,
-      "learning_rate": 3.0745532963647564e-05,
-      "loss": 0.6937,
-      "step": 2500
-    },
-    {
-      "epoch": 1.39,
-      "learning_rate": 2.6894639556377083e-05,
-      "loss": 0.6936,
-      "step": 3000
-    },
-    {
-      "epoch": 1.62,
-      "learning_rate": 2.3043746149106595e-05,
-      "loss": 0.6936,
-      "step": 3500
-    },
-    {
-      "epoch": 1.85,
-      "learning_rate": 1.9192852741836106e-05,
-      "loss": 0.6936,
-      "step": 4000
-    },
-    {
-      "epoch": 1.85,
-      "eval_accuracy": {
-        "accuracy": 0.49749821300929237
-      },
-      "eval_f1": {
-        "f1": 0.6644391408114558
-      },
-      "eval_loss": 0.6938893795013428,
-      "eval_runtime": 11.9588,
-      "eval_samples_per_second": 233.969,
-      "eval_steps_per_second": 1.84,
-      "step": 4000
-    },
-    {
-      "epoch": 2.08,
-      "learning_rate": 1.534195933456562e-05,
-      "loss": 0.6933,
-      "step": 4500
-    },
-    {
-      "epoch": 2.31,
-      "learning_rate": 1.1491065927295133e-05,
-      "loss": 0.6934,
-      "step": 5000
-    },
-    {
-      "epoch": 2.54,
-      "learning_rate": 7.640172520024647e-06,
-      "loss": 0.6935,
-      "step": 5500
-    },
-    {
-      "epoch": 2.77,
-      "learning_rate": 3.789279112754159e-06,
-      "loss": 0.6935,
-      "step": 6000
-    },
-    {
-      "epoch": 2.77,
-      "eval_accuracy": {
-        "accuracy": 0.5025017869907077
-      },
-      "eval_f1": {
-        "f1": 0.0
-      },
-      "eval_loss": 0.6931451559066772,
-      "eval_runtime": 11.9466,
-      "eval_samples_per_second": 234.208,
-      "eval_steps_per_second": 1.842,
-      "step": 6000
-    }
-  ],
-  "max_steps": 6492,
   "num_train_epochs": 3,
-  "total_flos": 1.0469958254972928e+17,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.18181818181818182,
+  "global_step": 4,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
+  "log_history": [],
+  "max_steps": 66,
   "num_train_epochs": 3,
+  "total_flos": 67823308111872.0,
   "trial_name": null,
   "trial_params": null
 }

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4767a339eceb00e37c148ec2ef95cceaf80d8ec0242cfc80171905c16a7c8fdc
 size 3963

 version https://git-lfs.github.com/spec/v1
+oid sha256:e25d14ad4fc875720ef03324b41abfb757bf175890a09e38c377c5afaad866cc
 size 3963

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:caa61399b7a53227108ebc38249705c50a8fb19b1d595bb3a5d63e8831b7d1a3
 size 266267309

 version https://git-lfs.github.com/spec/v1
+oid sha256:409dfb718254049ca6895716068c3f4df968a22517ef020c66c5c26146f3ab5f
 size 266267309

tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4767a339eceb00e37c148ec2ef95cceaf80d8ec0242cfc80171905c16a7c8fdc
 size 3963

 version https://git-lfs.github.com/spec/v1
+oid sha256:e25d14ad4fc875720ef03324b41abfb757bf175890a09e38c377c5afaad866cc
 size 3963