TopLength / trainer_state.json
DumbledoreWiz's picture
Upload 4 files
77c23a1 verified
{
"best_metric": 0.8563636363636363,
"best_model_checkpoint": "/content/drive/MyDrive/autoTaggingProject/ViT/General/Features/TopLength/Results/model_2024-10-16_test/checkpoint-1925",
"epoch": 7.0,
"eval_steps": 500,
"global_step": 1925,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.36363636363636365,
"grad_norm": 1.4969431161880493,
"learning_rate": 9.81818181818182e-06,
"loss": 1.6534,
"step": 100
},
{
"epoch": 0.7272727272727273,
"grad_norm": 2.2577221393585205,
"learning_rate": 9.636363636363638e-06,
"loss": 1.317,
"step": 200
},
{
"epoch": 1.0,
"eval_accuracy": 0.7218181818181818,
"eval_loss": 1.0995656251907349,
"eval_runtime": 12.6938,
"eval_samples_per_second": 43.328,
"eval_steps_per_second": 1.418,
"step": 275
},
{
"epoch": 1.0909090909090908,
"grad_norm": 2.7553977966308594,
"learning_rate": 9.454545454545456e-06,
"loss": 1.0529,
"step": 300
},
{
"epoch": 1.4545454545454546,
"grad_norm": 2.5488719940185547,
"learning_rate": 9.272727272727273e-06,
"loss": 0.9003,
"step": 400
},
{
"epoch": 1.8181818181818183,
"grad_norm": 2.936871290206909,
"learning_rate": 9.090909090909091e-06,
"loss": 0.7955,
"step": 500
},
{
"epoch": 2.0,
"eval_accuracy": 0.7890909090909091,
"eval_loss": 0.8251153826713562,
"eval_runtime": 11.8903,
"eval_samples_per_second": 46.256,
"eval_steps_per_second": 1.514,
"step": 550
},
{
"epoch": 2.1818181818181817,
"grad_norm": 3.6827473640441895,
"learning_rate": 8.90909090909091e-06,
"loss": 0.7386,
"step": 600
},
{
"epoch": 2.5454545454545454,
"grad_norm": 2.6154849529266357,
"learning_rate": 8.727272727272728e-06,
"loss": 0.6758,
"step": 700
},
{
"epoch": 2.909090909090909,
"grad_norm": 6.043990135192871,
"learning_rate": 8.545454545454546e-06,
"loss": 0.6518,
"step": 800
},
{
"epoch": 3.0,
"eval_accuracy": 0.82,
"eval_loss": 0.7125250101089478,
"eval_runtime": 11.5548,
"eval_samples_per_second": 47.599,
"eval_steps_per_second": 1.558,
"step": 825
},
{
"epoch": 3.2727272727272725,
"grad_norm": 1.676995873451233,
"learning_rate": 8.363636363636365e-06,
"loss": 0.6034,
"step": 900
},
{
"epoch": 3.6363636363636362,
"grad_norm": 2.6665966510772705,
"learning_rate": 8.181818181818183e-06,
"loss": 0.5865,
"step": 1000
},
{
"epoch": 4.0,
"grad_norm": 3.419482469558716,
"learning_rate": 8.000000000000001e-06,
"loss": 0.5531,
"step": 1100
},
{
"epoch": 4.0,
"eval_accuracy": 0.8218181818181818,
"eval_loss": 0.5728441476821899,
"eval_runtime": 11.88,
"eval_samples_per_second": 46.296,
"eval_steps_per_second": 1.515,
"step": 1100
},
{
"epoch": 4.363636363636363,
"grad_norm": 2.151674747467041,
"learning_rate": 7.81818181818182e-06,
"loss": 0.5151,
"step": 1200
},
{
"epoch": 4.7272727272727275,
"grad_norm": 4.103756427764893,
"learning_rate": 7.63818181818182e-06,
"loss": 0.5118,
"step": 1300
},
{
"epoch": 5.0,
"eval_accuracy": 0.84,
"eval_loss": 0.631469190120697,
"eval_runtime": 11.4374,
"eval_samples_per_second": 48.088,
"eval_steps_per_second": 1.574,
"step": 1375
},
{
"epoch": 5.090909090909091,
"grad_norm": 2.0776937007904053,
"learning_rate": 7.456363636363637e-06,
"loss": 0.4878,
"step": 1400
},
{
"epoch": 5.454545454545454,
"grad_norm": 4.111904621124268,
"learning_rate": 7.274545454545456e-06,
"loss": 0.4802,
"step": 1500
},
{
"epoch": 5.818181818181818,
"grad_norm": 3.490161657333374,
"learning_rate": 7.092727272727273e-06,
"loss": 0.4713,
"step": 1600
},
{
"epoch": 6.0,
"eval_accuracy": 0.84,
"eval_loss": 0.4893127381801605,
"eval_runtime": 11.1344,
"eval_samples_per_second": 49.396,
"eval_steps_per_second": 1.617,
"step": 1650
},
{
"epoch": 6.181818181818182,
"grad_norm": 3.1339528560638428,
"learning_rate": 6.910909090909092e-06,
"loss": 0.4365,
"step": 1700
},
{
"epoch": 6.545454545454545,
"grad_norm": 3.686084032058716,
"learning_rate": 6.72909090909091e-06,
"loss": 0.4155,
"step": 1800
},
{
"epoch": 6.909090909090909,
"grad_norm": 3.6479032039642334,
"learning_rate": 6.5472727272727275e-06,
"loss": 0.4251,
"step": 1900
},
{
"epoch": 7.0,
"eval_accuracy": 0.8563636363636363,
"eval_loss": 0.48278242349624634,
"eval_runtime": 11.2502,
"eval_samples_per_second": 48.888,
"eval_steps_per_second": 1.6,
"step": 1925
}
],
"logging_steps": 100,
"max_steps": 5500,
"num_input_tokens_seen": 0,
"num_train_epochs": 20,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 4.773677693976576e+18,
"train_batch_size": 32,
"trial_name": null,
"trial_params": null
}