Training in progress, epoch 0

Files changed (10) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1f11c590e1480fdf74fe4b6544fd70a709a2fdeff7ceaa9f956963ba6391b693
 size 997319621

 version https://git-lfs.github.com/spec/v1
+oid sha256:77d1bf854c477ccb21cecc86ec64b77ce1debd9ab2878382fb7560a3fe193286
 size 997319621

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f49e7f97df5d0c52c5d427c6593efb44759e13cc4ef9a15b734b007a931c1603
 size 498674357

 version https://git-lfs.github.com/spec/v1
+oid sha256:af8c195c1e4723204782fae64803a9762f176f3a479e652248db83d8924cdda2
 size 498674357

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7c35b1ae88be42b3fc92099950abfbbe324644492e7989ad94dbaa43aedacea0
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:01e7f2bd676c936e7a6fdf9cde6071c5938c578820d54a54ab03298d96dc82c2
 size 14575

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2be33b98103a754b8daaa7225a843cc0a81e2ebb32ec4f7e3413258e9dc61582
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:b6aae226b0a385b18c8012f4d652e8fbdd18f15a3fe78c710dfd63cccbeb8c1b
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,26 +1,32 @@
 {
-  "best_metric": 0.11368015414258188,
-  "best_model_checkpoint": "citation_intent_classification_roberta/checkpoint-26",
-  "epoch": 0.9811320754716981,
-  "global_step": 26,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 0.98,
-      "eval_accuracy": 0.5175438596491229,
-      "eval_f1_macro": 0.11368015414258188,
-      "eval_loss": 1.3259084224700928,
-      "eval_runtime": 0.2368,
-      "eval_samples_per_second": 481.487,
-      "eval_steps_per_second": 8.447,
-      "step": 26
     }
   ],
-  "max_steps": 260,
   "num_train_epochs": 10,
-  "total_flos": 123604968402720.0,
   "trial_name": null,
   "trial_params": null
 }

 {
+  "best_metric": 0.30339984350547733,
+  "best_model_checkpoint": "citation_intent_classification_roberta/checkpoint-105",
+  "epoch": 0.995260663507109,
+  "global_step": 105,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 0.95,
+      "learning_rate": 1.9250253292806485e-05,
+      "loss": 1.419,
+      "step": 100
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.6842105263157895,
+      "eval_f1_macro": 0.30339984350547733,
+      "eval_loss": 1.025266408920288,
+      "eval_runtime": 0.3451,
+      "eval_samples_per_second": 330.372,
+      "eval_steps_per_second": 23.184,
+      "step": 105
     }
   ],
+  "max_steps": 1050,
   "num_train_epochs": 10,
+  "total_flos": 88083700250400.0,
   "trial_name": null,
   "trial_params": null
 }

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:65cbd8cdabdfc11492daeffbbce5387ff8081c4bddbb5f09577afb9e67d9a373
 size 4027

 version https://git-lfs.github.com/spec/v1
+oid sha256:891f81c4bb14d91ce05b965dabf4fc022a49bfe16e973fcbc64c834412f8a677
 size 4027

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f49e7f97df5d0c52c5d427c6593efb44759e13cc4ef9a15b734b007a931c1603
 size 498674357

 version https://git-lfs.github.com/spec/v1
+oid sha256:af8c195c1e4723204782fae64803a9762f176f3a479e652248db83d8924cdda2
 size 498674357

runs/Apr20_23-32-31_jupyter/events.out.tfevents.1713655956.jupyter.2682803.6 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:afecf619d6907f68001b7148f4f2f1235aace11208ff60659051b0352e43b89c
-size 4721

 version https://git-lfs.github.com/spec/v1
+oid sha256:25541fce3a6985c9f0f0ce418a3cee21dd8a6bf5d8dd60d432679acac9f98cfa
+size 5089

runs/Apr20_23-37-01_jupyter/events.out.tfevents.1713656225.jupyter.2695507.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:90903b8aba13a239fa899ea82a81750291fc80f90e100d263b1ecaa1421fbfdd
+size 4875

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:65cbd8cdabdfc11492daeffbbce5387ff8081c4bddbb5f09577afb9e67d9a373
 size 4027

 version https://git-lfs.github.com/spec/v1
+oid sha256:891f81c4bb14d91ce05b965dabf4fc022a49bfe16e973fcbc64c834412f8a677
 size 4027