Ramadhiana
committed on
Upload trainer_state.json with huggingface_hub
Browse files
- trainer_state.json +11 -4
trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": 900,
|
| 3 |
"best_metric": 0.5792015790939331,
|
| 4 |
"best_model_checkpoint": "/content/drive/MyDrive/Colab Notebooks/AITF_baseCPT_V1.2/checkpoint-900",
|
| 5 |
-
"epoch": 0
|
| 6 |
"eval_steps": 100,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -395,6 +395,13 @@
|
|
| 395 |
"eval_samples_per_second": 10.031,
|
| 396 |
"eval_steps_per_second": 2.51,
|
| 397 |
"step": 900
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 398 |
}
|
| 399 |
],
|
| 400 |
"logging_steps": 20,
|
|
@@ -409,12 +416,12 @@
|
|
| 409 |
"should_evaluate": false,
|
| 410 |
"should_log": false,
|
| 411 |
"should_save": true,
|
| 412 |
-
"should_training_stop":
|
| 413 |
},
|
| 414 |
"attributes": {}
|
| 415 |
}
|
| 416 |
},
|
| 417 |
-
"total_flos": 1.
|
| 418 |
"train_batch_size": 4,
|
| 419 |
"trial_name": null,
|
| 420 |
"trial_params": null
|
|
|
|
| 2 |
"best_global_step": 900,
|
| 3 |
"best_metric": 0.5792015790939331,
|
| 4 |
"best_model_checkpoint": "/content/drive/MyDrive/Colab Notebooks/AITF_baseCPT_V1.2/checkpoint-900",
|
| 5 |
+
"epoch": 1.0,
|
| 6 |
"eval_steps": 100,
|
| 7 |
+
"global_step": 929,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 395 |
"eval_samples_per_second": 10.031,
|
| 396 |
"eval_steps_per_second": 2.51,
|
| 397 |
"step": 900
|
| 398 |
+
},
|
| 399 |
+
{
|
| 400 |
+
"epoch": 0.9904454313013054,
|
| 401 |
+
"grad_norm": 0.33122149109840393,
|
| 402 |
+
"learning_rate": 6.386247842353754e-08,
|
| 403 |
+
"loss": 0.5844,
|
| 404 |
+
"step": 920
|
| 405 |
}
|
| 406 |
],
|
| 407 |
"logging_steps": 20,
|
|
|
|
| 416 |
"should_evaluate": false,
|
| 417 |
"should_log": false,
|
| 418 |
"should_save": true,
|
| 419 |
+
"should_training_stop": true
|
| 420 |
},
|
| 421 |
"attributes": {}
|
| 422 |
}
|
| 423 |
},
|
| 424 |
+
"total_flos": 1.2627950806210068e+18,
|
| 425 |
"train_batch_size": 4,
|
| 426 |
"trial_name": null,
|
| 427 |
"trial_params": null
|