checkpoint 30000

Files changed (5) hide show

adapter_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:58ff9f13fe4fd43916c511c4e7a58027c1ce30fb6b7744815a66a31aa378e9d7
 size 261189898

 version https://git-lfs.github.com/spec/v1
+oid sha256:b9c4c7ad6ebdf2339a8e4943f3789ad3d1356d61545dc81a808ca389600603c2
 size 261189898

optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7318a7e6b468b1f60f77c2df735b4138a4972075a7f9d23b7cbbc3ea18158b34
 size 1044540346

 version https://git-lfs.github.com/spec/v1
+oid sha256:e11dee7b190c2fdad32a73d0114456b9d1228b2639e23b931aba09ba9c01fba5
 size 1044540346

rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:453bd6991fe36c7874b91d8fe044905b7822553a1079f2afd925646c3b124eb5
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:c0ddba1f85ace420be047b39da567706e4ccc0c0db8f35bf72010cd9c84b58dc
 size 14244

scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:25d9b43d9967cc267ee69f422bfad8c170bd37836e9da711be203c8963d6971e
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:ac7de8907e79c9f47fccf3aa89da8ca3d3d851fdb56e005195640f80ea9c8917
 size 1064

trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 14.634146341463415,
-  "global_step": 15000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -36,11 +36,41 @@
       "learning_rate": 0.0002,
       "loss": 1.3908,
       "step": 15000
     }
   ],
   "max_steps": 30000,
   "num_train_epochs": 30,
-  "total_flos": 3.1738277265408e+18,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 29.26829268292683,
+  "global_step": 30000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.0002,
       "loss": 1.3908,
       "step": 15000
+    },
+    {
+      "epoch": 17.56,
+      "learning_rate": 0.0002,
+      "loss": 1.7294,
+      "step": 18000
+    },
+    {
+      "epoch": 20.49,
+      "learning_rate": 0.0002,
+      "loss": 1.2396,
+      "step": 21000
+    },
+    {
+      "epoch": 23.41,
+      "learning_rate": 0.0002,
+      "loss": 1.5304,
+      "step": 24000
+    },
+    {
+      "epoch": 26.34,
+      "learning_rate": 0.0002,
+      "loss": 2.3882,
+      "step": 27000
+    },
+    {
+      "epoch": 29.27,
+      "learning_rate": 0.0002,
+      "loss": 2.0081,
+      "step": 30000
     }
   ],
   "max_steps": 30000,
   "num_train_epochs": 30,
+  "total_flos": 6.3476554530816e+18,
   "trial_name": null,
   "trial_params": null
 }