Training in progress, step 4500
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scaler.pt +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +25 -5
- pytorch_model.bin +1 -1
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 484047087
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:40f4f98e46de3c07a828a394b19de608600df5a8959a611b94c49f6e55c00421
|
| 3 |
size 484047087
|
last-checkpoint/pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 242012923
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:54602dfec10bab76ce2c95f67a8cbdf28da47412951809b31f0391258fc69619
|
| 3 |
size 242012923
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14503
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:01090280fcabe40622fe48a644e9b4896052397cf0ee2744cb3076b4fb0679f0
|
| 3 |
size 14503
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 559
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:81892849a9975e89bed9f593eaf444b5c98c6c493066ba697087e4a58e0c4ab9
|
| 3 |
size 559
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 623
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a48f8e819e8957fd0b49886c63ef7f3d8411579a2765052e7e9467496739fb02
|
| 3 |
size 623
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
{
|
| 2 |
-
"best_metric": 0.
|
| 3 |
-
"best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-adamw/checkpoint-
|
| 4 |
-
"epoch": 1.
|
| 5 |
-
"global_step":
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
@@ -166,11 +166,31 @@
|
|
| 166 |
"eval_samples_per_second": 75.83,
|
| 167 |
"eval_steps_per_second": 2.389,
|
| 168 |
"step": 4000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 169 |
}
|
| 170 |
],
|
| 171 |
"max_steps": 31250,
|
| 172 |
"num_train_epochs": 10,
|
| 173 |
-
"total_flos": 1.
|
| 174 |
"trial_name": null,
|
| 175 |
"trial_params": null
|
| 176 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"best_metric": 0.7942736744880676,
|
| 3 |
+
"best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-adamw/checkpoint-4500",
|
| 4 |
+
"epoch": 1.44,
|
| 5 |
+
"global_step": 4500,
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
|
|
| 166 |
"eval_samples_per_second": 75.83,
|
| 167 |
"eval_steps_per_second": 2.389,
|
| 168 |
"step": 4000
|
| 169 |
+
},
|
| 170 |
+
{
|
| 171 |
+
"epoch": 1.44,
|
| 172 |
+
"learning_rate": 9.012362313470542e-05,
|
| 173 |
+
"loss": 0.6236,
|
| 174 |
+
"step": 4500
|
| 175 |
+
},
|
| 176 |
+
{
|
| 177 |
+
"epoch": 1.44,
|
| 178 |
+
"eval_bleu": 0.12748409364928656,
|
| 179 |
+
"eval_exact_match": 0.163,
|
| 180 |
+
"eval_loss": 0.7942736744880676,
|
| 181 |
+
"eval_rouge1": 0.563881072938117,
|
| 182 |
+
"eval_rouge2": 0.3930844670404538,
|
| 183 |
+
"eval_rougeL": 0.5455192493710137,
|
| 184 |
+
"eval_rougeLsum": 0.5541560433164279,
|
| 185 |
+
"eval_runtime": 26.3891,
|
| 186 |
+
"eval_samples_per_second": 75.789,
|
| 187 |
+
"eval_steps_per_second": 2.387,
|
| 188 |
+
"step": 4500
|
| 189 |
}
|
| 190 |
],
|
| 191 |
"max_steps": 31250,
|
| 192 |
"num_train_epochs": 10,
|
| 193 |
+
"total_flos": 1.915698912480461e+16,
|
| 194 |
"trial_name": null,
|
| 195 |
"trial_params": null
|
| 196 |
}
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 242012923
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:54602dfec10bab76ce2c95f67a8cbdf28da47412951809b31f0391258fc69619
|
| 3 |
size 242012923
|