Training in progress, step 40, checkpoint

Files changed (8) hide show

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b999a352785b09d15860c1320662d8ec817d298e02812f21d68f01e900838dea
 size 723674912

 version https://git-lfs.github.com/spec/v1
+oid sha256:ecf30145777b99e1483b3b8af8ca3c954b0bee05ef0cd517f6e62511cecc1737
 size 723674912

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2899f09cd2c54fdf5ef96e88d4218eefc8c7ef1b0315b44f21f9a89576e1bb98
 size 735625370

 version https://git-lfs.github.com/spec/v1
+oid sha256:6361dd5e29307df7b873ae303523973ac614868fbd2cc1c02b982d5d15c248f8
 size 735625370

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:69a04a1208f7a0d6f51f37a136b5c2e55bf3f53b3d0fd57164c5b83ca47a2645
 size 15024

 version https://git-lfs.github.com/spec/v1
+oid sha256:9664d03c75ff248cdee237bc0f578d0ab4ef30cf459a48b947cc8ba96efcf94a
 size 15024

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:080a7e72d6be938a9418e60003db90412af8a61e6434f9e9f1b598cca861dbcd
 size 15024

 version https://git-lfs.github.com/spec/v1
+oid sha256:e0fc8395b524cd5cac61206279bf13d167d68f260f6be7c6c7eca67cec66f27c
 size 15024

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c3d114a75d37be476b865187eb2b3d29d9343b131614a08f42be0014f110ce6f
 size 15024

 version https://git-lfs.github.com/spec/v1
+oid sha256:6ca0fe34fb6c7827e42ed53ce617ab6af68578cc38e07c82ad0cc484dafb3017
 size 15024

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4fc5a0f78838743362c5d5378dff81ea2f7d0039da53a423f1759e861bc6b233
 size 15024

 version https://git-lfs.github.com/spec/v1
+oid sha256:1f1cc5e77aed95b6e97dac8961ae1ecb44cecf9736fe10dadd3ddbb8b2eb1ac6
 size 15024

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3bb34b6c62864960ca7a1a2bf6005b33b4420cc8055506432b79e0fe18bca2cd
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:62b5eb3be65174d535b2988d2d3d904fb7ecffa959b2cce72a3b7b18e92c3e6a
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.5,
   "eval_steps": 20,
-  "global_step": 20,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -37,6 +37,28 @@
       "eval_samples_per_second": 309.27,
       "eval_steps_per_second": 3.503,
       "step": 20
     }
   ],
   "logging_steps": 10,
@@ -56,7 +78,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 7113876738932736.0,
   "train_batch_size": 23,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 5.0,
   "eval_steps": 20,
+  "global_step": 40,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 309.27,
       "eval_steps_per_second": 3.503,
       "step": 20
+    },
+    {
+      "epoch": 3.75,
+      "grad_norm": 0.162109375,
+      "learning_rate": 0.00019458172417006347,
+      "loss": 2.1785,
+      "step": 30
+    },
+    {
+      "epoch": 5.0,
+      "grad_norm": 0.1376953125,
+      "learning_rate": 0.0001879473751206489,
+      "loss": 2.136,
+      "step": 40
+    },
+    {
+      "epoch": 5.0,
+      "eval_loss": 2.082921028137207,
+      "eval_runtime": 4.8453,
+      "eval_samples_per_second": 309.785,
+      "eval_steps_per_second": 3.509,
+      "step": 40
     }
   ],
   "logging_steps": 10,
       "attributes": {}
     }
   },
+  "total_flos": 1.4227753477865472e+16,
   "train_batch_size": 23,
   "trial_name": null,
   "trial_params": null