Training in progress, step 11000

Files changed (12) hide show

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "/content/Socrat_4",
   "activation_function": "gelu_new",
   "architectures": [
     "GPT2LMHeadModel"

 {
+  "_name_or_path": "/content/Socrat/last-checkpoint",
   "activation_function": "gelu_new",
   "architectures": [
     "GPT2LMHeadModel"

last-checkpoint/config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "/content/Socrat_4",
   "activation_function": "gelu_new",
   "architectures": [
     "GPT2LMHeadModel"

 {
+  "_name_or_path": "/content/Socrat/last-checkpoint",
   "activation_function": "gelu_new",
   "architectures": [
     "GPT2LMHeadModel"

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d43d75d9a69cab6bbdc5d807e2bb46ff6cdc4a8d041a08ec646f4a6e3cd2db85
 size 2847145157

 version https://git-lfs.github.com/spec/v1
+oid sha256:8720595d9cd147ba8bd6abc76e18e81c63e203a5b44ecc616282800b286e6f36
 size 2847145157

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ddbae1252128d10be81c8573c827bec76386fb0202a5c3196a13dad3d7c56f87
 size 1524261149

 version https://git-lfs.github.com/spec/v1
+oid sha256:36f3de48b1b73850c149cde38909a25b776fb76e72c1a1c7caf5503c22ed001a
 size 1524261149

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4726f886967d0edea6aba4d768b4e7e6c5f2c77453e08bd258b36ebd6bbf0054
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:e8a0709b6819bc1359d68b27147b21e79a4b0ab08155c73633b9b5980d48b775
 size 14575

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d83ea694a86cc0c579d479f8a93d9e180abe564de49dd67c75124cdac727a14a
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:1f8f9ac5225a5e9f7fe84cd20e2b56b961f452f409f1ca512b75e655587f5d09
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.5012506253126565,
-  "global_step": 10000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -206,11 +206,31 @@
       "eval_samples_per_second": 15.532,
       "eval_steps_per_second": 5.18,
       "step": 10000
     }
   ],
   "max_steps": 19990,
   "num_train_epochs": 5,
-  "total_flos": 1.41481746432e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.7513756878439217,
+  "global_step": 11000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 15.532,
       "eval_steps_per_second": 5.18,
       "step": 10000
+    },
+    {
+      "epoch": 2.63,
+      "learning_rate": 9.494747373686844e-06,
+      "loss": 2.6173,
+      "step": 10500
+    },
+    {
+      "epoch": 2.75,
+      "learning_rate": 8.994497248624313e-06,
+      "loss": 2.6314,
+      "step": 11000
+    },
+    {
+      "epoch": 2.75,
+      "eval_loss": 3.12784481048584,
+      "eval_runtime": 143.6305,
+      "eval_samples_per_second": 14.739,
+      "eval_steps_per_second": 4.915,
+      "step": 11000
     }
   ],
   "max_steps": 19990,
   "num_train_epochs": 5,
+  "total_flos": 1.556299210752e+16,
   "trial_name": null,
   "trial_params": null
 }

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:918b854d4ced36747513144ebd0eebe9f265f3dbaedccdbeea45c88b4a5aac6b
 size 3515

 version https://git-lfs.github.com/spec/v1
+oid sha256:9c73f1a75e190362ef7c8240bf1c1babc7762c20322487413673a3acb504d42b
 size 3515

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ddbae1252128d10be81c8573c827bec76386fb0202a5c3196a13dad3d7c56f87
 size 1524261149

 version https://git-lfs.github.com/spec/v1
+oid sha256:36f3de48b1b73850c149cde38909a25b776fb76e72c1a1c7caf5503c22ed001a
 size 1524261149

runs/Mar21_22-11-09_493485ec0ec3/1679436700.0595562/events.out.tfevents.1679436700.493485ec0ec3.312.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:95c09fdcaef4701b0ca04894990682343b2e558f5ca942a5b7a1e2cac5b158c6
+size 5742

runs/Mar21_22-11-09_493485ec0ec3/events.out.tfevents.1679436700.493485ec0ec3.312.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:e45471f0b2e945d7dfe440a410866c7d81dced0c30e01d0ec457a92a32e67ed5
+size 4797

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:918b854d4ced36747513144ebd0eebe9f265f3dbaedccdbeea45c88b4a5aac6b
 size 3515

 version https://git-lfs.github.com/spec/v1
+oid sha256:9c73f1a75e190362ef7c8240bf1c1babc7762c20322487413673a3acb504d42b
 size 3515