Training in progress, step 2100, checkpoint

Files changed (8) hide show

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:caf96f2d62cddc6fc7aef86afed7385860dc88331433a83ae6b7e9403b958447
 size 2682482800

 version https://git-lfs.github.com/spec/v1
+oid sha256:a785245b9db918f8075f864bb71b2ef94bdafb7e3dfb6d5b8ae27897b53e5856
 size 2682482800

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b7918ffccb124a064f589acf5d911356d6c8d6e0a5a05a633194d0317ff5b135
 size 5365108834

 version https://git-lfs.github.com/spec/v1
+oid sha256:f18aa6e97bfed0261afda1f92b597f5249cac28141302e759a490137ffb174ed
 size 5365108834

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f6e41fc7393e4681202895f12ea2bdd6fcdbe52f58f01d5a51f67dfdd0eb7cf4
 size 15024

 version https://git-lfs.github.com/spec/v1
+oid sha256:8b73bcda2af2a8653a39b5acd3cf8db4779d11cc560ce05a1ed022d03a6467c6
 size 15024

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:47970a80ccd55cd9b1e285608a69c5a852edb532757a89198968e982fdaea9d0
 size 15024

 version https://git-lfs.github.com/spec/v1
+oid sha256:7669ee2b753b4a1b38f068a799eadb312c8a89e69d877b91860a8c132c26bd0d
 size 15024

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:72985cd90a25d0c462ffc57bcd399b30b144c7fb5a1dd290d1cafafcbd2772ae
 size 15024

 version https://git-lfs.github.com/spec/v1
+oid sha256:7b5fc7daea5a1677f0ca4be841f484245a233687c2c91d61d675ad21da37b200
 size 15024

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b232b8c73f42212c2ad02445b917ce897a3fa48fa4fb0b636a2fec7bc9464b23
 size 15024

 version https://git-lfs.github.com/spec/v1
+oid sha256:5bd36615d87deabb9ffc7df98612a630cff63482f076572324115b3e7de11263
 size 15024

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:79835d376c5ef7814504b05c236a39cb31e7978e87454f4c1983636759268bec
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:891dcd976a2cfcf266a598c09521a8a1af39423c8f98b39c83ad1e33e92dfeb2
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.1535046429158207,
   "eval_steps": 100,
-  "global_step": 2000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -287,6 +287,20 @@
       "learning_rate": 0.0008464844949339884,
       "loss": 1.7085,
       "step": 2000
     }
   ],
   "logging_steps": 50,
@@ -306,7 +320,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 3.4283095449696993e+18,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.16117987506161172,
   "eval_steps": 100,
+  "global_step": 2100,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.0008464844949339884,
       "loss": 1.7085,
       "step": 2000
+    },
+    {
+      "epoch": 0.1573422589887162,
+      "grad_norm": 0.6814237833023071,
+      "learning_rate": 0.0008426466073073382,
+      "loss": 1.7057,
+      "step": 2050
+    },
+    {
+      "epoch": 0.16117987506161172,
+      "grad_norm": 0.453630268573761,
+      "learning_rate": 0.0008388087196806877,
+      "loss": 1.705,
+      "step": 2100
     }
   ],
   "logging_steps": 50,
       "attributes": {}
     }
   },
+  "total_flos": 3.599673019183661e+18,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null