Training in progress, step 100, checkpoint

Files changed (6) hide show

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d5caa6b92b6430b5541b79e0b58f7ca5bb7d35f38bba2d968f71df2dc83838d5
 size 2611614300

 version https://git-lfs.github.com/spec/v1
+oid sha256:507d55726514d36d57a7fdead1e533238594fb1d956a903a49ce02157b571e17
 size 2611614300

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8a616e5e2709e474c9e362c0f8f56e247d8aba32eca2de467636730b28c4d4ef
 size 5213028466

 version https://git-lfs.github.com/spec/v1
+oid sha256:2fb309794c77ba81c5d999193c64bdbf97c4b11eecd10e3754dddae31d948844
 size 5213028466

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7e3307365943bdb97704420d03c23d6d5be63a26f2aeac779ce1f4ea6ad16d9e
 size 14942

 version https://git-lfs.github.com/spec/v1
+oid sha256:874b9aec013ad321d4edc1c021ca42f8014c7ff34d53714ff8059015e8ee9794
 size 14942

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:68efe461a0b35c4aec0914c8e4be32a81c4a4261603765c475d2e90661d821c9
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:c39af0f6970331c0f430d145f5514421d9baa7e90f9cf02971fb62606bf1ff3d
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,26 +1,26 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.24843756065370134,
-  "eval_steps": 5000,
-  "global_step": 1000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 0.24843756065370134,
-      "grad_norm": 0.6212329864501953,
-      "learning_rate": 0.0009751552795031056,
-      "loss": 5.552229361614273e+25,
-      "step": 1000
     }
   ],
-  "logging_steps": 1000,
   "max_steps": 40250,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 10,
-  "save_steps": 1000,
   "stateful_callbacks": {
     "TrainerControl": {
       "args": {
@@ -33,7 +33,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 1.9448797327261696e+17,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.024843756065370134,
+  "eval_steps": 500,
+  "global_step": 100,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 0.024843756065370134,
+      "grad_norm": 0.9147792458534241,
+      "learning_rate": 0.0009975155279503105,
+      "loss": 1.0811305421386547e+17,
+      "step": 100
     }
   ],
+  "logging_steps": 100,
   "max_steps": 40250,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 10,
+  "save_steps": 100,
   "stateful_callbacks": {
     "TrainerControl": {
       "args": {
       "attributes": {}
     }
   },
+  "total_flos": 1.9448797327261696e+16,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b7148c30a014b8855d44fa1707c1d7591fba5860cd9f37063b980d6b66e148b9
 size 5176

 version https://git-lfs.github.com/spec/v1
+oid sha256:0aae1b036793cf546f080bfdd66ff5e43f2ec5b41ab240614331a01cb7e0e4a5
 size 5176