Training in progress, epoch 1

Files changed (9) hide show

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ff45c0b93d503c4ab2cceae124b29584f7fbda2cef9dcc16084a848f895df539
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:3856f5d52b139f68324c7fde3f7b30f487ee6e7fee6adeb65d95f8f88928dc48
 size 267832560

run-3/checkpoint-2138/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:80f2c334ed4f1f294a2f916451cea250a4cfa86cd9c6ec539ac77b6e87747ee5
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:3856f5d52b139f68324c7fde3f7b30f487ee6e7fee6adeb65d95f8f88928dc48
 size 267832560

run-3/checkpoint-2138/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9c5e39aab0ba5776938cf76f475fbe95fc4816348d471338d1eda66c42a7f697
 size 535727290

 version https://git-lfs.github.com/spec/v1
+oid sha256:4e472fbf5f8cc5c472eae2173d310316c60a1b566a27c98944f6e61017eab16f
 size 535727290

run-3/checkpoint-2138/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d076be17692cfa345b0f1981db591dc8bcdd0b29c1b64b0637d37bb7f8ea4265
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:21acd9373ba2636a96a037599a124a8848e64458d7ed9a26ffc24cbd4056b661
 size 14244

run-3/checkpoint-2138/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f78ca8dc6a7929f80c42b973d6b726c0c10724f3fabc46b62fb266e16c4fb748
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:f4249bf660aed0d3def9d8b0f79d921f7a157b3f4104064206caa1eaa6c6ede4
 size 1064

run-3/checkpoint-2138/trainer_state.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_metric": 0.3194134442722084,
   "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-2138",
   "epoch": 1.0,
   "eval_steps": 500,
@@ -10,35 +10,35 @@
   "log_history": [
     {
       "epoch": 0.23,
-      "learning_rate": 2.109376138070761e-06,
-      "loss": 0.5971,
       "step": 500
     },
     {
       "epoch": 0.47,
-      "learning_rate": 1.8300625604660523e-06,
-      "loss": 0.575,
       "step": 1000
     },
     {
       "epoch": 0.7,
-      "learning_rate": 1.5507489828613434e-06,
-      "loss": 0.5345,
       "step": 1500
     },
     {
       "epoch": 0.94,
-      "learning_rate": 1.2714354052566345e-06,
-      "loss": 0.5352,
       "step": 2000
     },
     {
       "epoch": 1.0,
-      "eval_loss": 0.5899004936218262,
-      "eval_matthews_correlation": 0.3194134442722084,
-      "eval_runtime": 0.7491,
-      "eval_samples_per_second": 1392.35,
-      "eval_steps_per_second": 88.107,
       "step": 2138
     }
   ],
@@ -47,13 +47,13 @@
   "num_input_tokens_seen": 0,
   "num_train_epochs": 2,
   "save_steps": 500,
-  "total_flos": 32608713001968.0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": {
-    "learning_rate": 2.38868971567547e-06,
     "num_train_epochs": 2,
     "per_device_train_batch_size": 4,
-    "seed": 28
   }
 }

 {
+  "best_metric": 0.0463559874942472,
   "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-2138",
   "epoch": 1.0,
   "eval_steps": 500,
   "log_history": [
     {
       "epoch": 0.23,
+      "learning_rate": 1.3504098486610872e-06,
+      "loss": 0.6235,
       "step": 500
     },
     {
       "epoch": 0.47,
+      "learning_rate": 1.1715949852260916e-06,
+      "loss": 0.6084,
       "step": 1000
     },
     {
       "epoch": 0.7,
+      "learning_rate": 9.92780121791096e-07,
+      "loss": 0.5687,
       "step": 1500
     },
     {
       "epoch": 0.94,
+      "learning_rate": 8.139652583561002e-07,
+      "loss": 0.5599,
       "step": 2000
     },
     {
       "epoch": 1.0,
+      "eval_loss": 0.5971149802207947,
+      "eval_matthews_correlation": 0.0463559874942472,
+      "eval_runtime": 0.7351,
+      "eval_samples_per_second": 1418.884,
+      "eval_steps_per_second": 89.786,
       "step": 2138
     }
   ],
   "num_input_tokens_seen": 0,
   "num_train_epochs": 2,
   "save_steps": 500,
+  "total_flos": 32410011903984.0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": {
+    "learning_rate": 1.529224712096083e-06,
     "num_train_epochs": 2,
     "per_device_train_batch_size": 4,
+    "seed": 5
   }
 }

run-3/checkpoint-2138/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:58fae703abd28cb0ab5528ac939f06e8a9578110f6c6558da0b2c2f9c2704502
 size 4792

 version https://git-lfs.github.com/spec/v1
+oid sha256:ff0b8762417b71e573ee14cf5d6c55e801af11f299848bcf4bde51f1e4499d53
 size 4792

runs/Dec23_01-09-39_cab176ec49ea/events.out.tfevents.1703294598.cab176ec49ea.681.5 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:0aec5cbcca727aa7079f2bff88b7723e3256d02957fd46f8f12881568ec6a043
+size 5459

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:57f7a911be8af835fd7cdb5ddc7dfd5e78fd1882a2c8b09cc2ae78dc7aabb4f0
 size 4792

 version https://git-lfs.github.com/spec/v1
+oid sha256:ff0b8762417b71e573ee14cf5d6c55e801af11f299848bcf4bde51f1e4499d53
 size 4792