Yogesh1p's picture
End of training
262d248
{
"best_metric": 0.8666666666666667,
"best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-cp1/checkpoint-22",
"epoch": 27.692307692307693,
"eval_steps": 500,
"global_step": 90,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.92,
"eval_accuracy": 0.8222222222222222,
"eval_loss": 0.43046388030052185,
"eval_runtime": 0.7101,
"eval_samples_per_second": 63.368,
"eval_steps_per_second": 2.816,
"step": 3
},
{
"epoch": 1.85,
"eval_accuracy": 0.8,
"eval_loss": 0.45104652643203735,
"eval_runtime": 0.2996,
"eval_samples_per_second": 150.201,
"eval_steps_per_second": 6.676,
"step": 6
},
{
"epoch": 2.77,
"eval_accuracy": 0.7777777777777778,
"eval_loss": 0.4328728914260864,
"eval_runtime": 0.3627,
"eval_samples_per_second": 124.077,
"eval_steps_per_second": 5.515,
"step": 9
},
{
"epoch": 3.08,
"learning_rate": 4.938271604938271e-05,
"loss": 0.3489,
"step": 10
},
{
"epoch": 4.0,
"eval_accuracy": 0.7777777777777778,
"eval_loss": 0.49650371074676514,
"eval_runtime": 0.3082,
"eval_samples_per_second": 145.987,
"eval_steps_per_second": 6.488,
"step": 13
},
{
"epoch": 4.92,
"eval_accuracy": 0.8,
"eval_loss": 0.4246769845485687,
"eval_runtime": 0.5832,
"eval_samples_per_second": 77.157,
"eval_steps_per_second": 3.429,
"step": 16
},
{
"epoch": 5.85,
"eval_accuracy": 0.8444444444444444,
"eval_loss": 0.35588106513023376,
"eval_runtime": 0.3557,
"eval_samples_per_second": 126.495,
"eval_steps_per_second": 5.622,
"step": 19
},
{
"epoch": 6.15,
"learning_rate": 4.3209876543209875e-05,
"loss": 0.2872,
"step": 20
},
{
"epoch": 6.77,
"eval_accuracy": 0.8666666666666667,
"eval_loss": 0.3628138601779938,
"eval_runtime": 0.3453,
"eval_samples_per_second": 130.324,
"eval_steps_per_second": 5.792,
"step": 22
},
{
"epoch": 8.0,
"eval_accuracy": 0.8666666666666667,
"eval_loss": 0.35114532709121704,
"eval_runtime": 0.3013,
"eval_samples_per_second": 149.361,
"eval_steps_per_second": 6.638,
"step": 26
},
{
"epoch": 8.92,
"eval_accuracy": 0.8666666666666667,
"eval_loss": 0.353840708732605,
"eval_runtime": 0.3515,
"eval_samples_per_second": 128.025,
"eval_steps_per_second": 5.69,
"step": 29
},
{
"epoch": 9.23,
"learning_rate": 3.7037037037037037e-05,
"loss": 0.3071,
"step": 30
},
{
"epoch": 9.85,
"eval_accuracy": 0.8222222222222222,
"eval_loss": 0.3643886148929596,
"eval_runtime": 0.2957,
"eval_samples_per_second": 152.16,
"eval_steps_per_second": 6.763,
"step": 32
},
{
"epoch": 10.77,
"eval_accuracy": 0.8222222222222222,
"eval_loss": 0.38603129982948303,
"eval_runtime": 0.3509,
"eval_samples_per_second": 128.255,
"eval_steps_per_second": 5.7,
"step": 35
},
{
"epoch": 12.0,
"eval_accuracy": 0.8,
"eval_loss": 0.5916851162910461,
"eval_runtime": 0.3126,
"eval_samples_per_second": 143.949,
"eval_steps_per_second": 6.398,
"step": 39
},
{
"epoch": 12.31,
"learning_rate": 3.08641975308642e-05,
"loss": 0.2765,
"step": 40
},
{
"epoch": 12.92,
"eval_accuracy": 0.7777777777777778,
"eval_loss": 0.51491379737854,
"eval_runtime": 0.349,
"eval_samples_per_second": 128.934,
"eval_steps_per_second": 5.73,
"step": 42
},
{
"epoch": 13.85,
"eval_accuracy": 0.7555555555555555,
"eval_loss": 0.5604969263076782,
"eval_runtime": 0.3081,
"eval_samples_per_second": 146.057,
"eval_steps_per_second": 6.491,
"step": 45
},
{
"epoch": 14.77,
"eval_accuracy": 0.8,
"eval_loss": 0.4737274944782257,
"eval_runtime": 0.3434,
"eval_samples_per_second": 131.024,
"eval_steps_per_second": 5.823,
"step": 48
},
{
"epoch": 15.38,
"learning_rate": 2.4691358024691357e-05,
"loss": 0.2637,
"step": 50
},
{
"epoch": 16.0,
"eval_accuracy": 0.8444444444444444,
"eval_loss": 0.4108584523200989,
"eval_runtime": 0.3059,
"eval_samples_per_second": 147.129,
"eval_steps_per_second": 6.539,
"step": 52
},
{
"epoch": 16.92,
"eval_accuracy": 0.8222222222222222,
"eval_loss": 0.3583980202674866,
"eval_runtime": 0.3526,
"eval_samples_per_second": 127.634,
"eval_steps_per_second": 5.673,
"step": 55
},
{
"epoch": 17.85,
"eval_accuracy": 0.8222222222222222,
"eval_loss": 0.3771374523639679,
"eval_runtime": 0.2992,
"eval_samples_per_second": 150.412,
"eval_steps_per_second": 6.685,
"step": 58
},
{
"epoch": 18.46,
"learning_rate": 1.8518518518518518e-05,
"loss": 0.2082,
"step": 60
},
{
"epoch": 18.77,
"eval_accuracy": 0.8222222222222222,
"eval_loss": 0.4406029284000397,
"eval_runtime": 0.3532,
"eval_samples_per_second": 127.395,
"eval_steps_per_second": 5.662,
"step": 61
},
{
"epoch": 20.0,
"eval_accuracy": 0.8222222222222222,
"eval_loss": 0.35921329259872437,
"eval_runtime": 0.3008,
"eval_samples_per_second": 149.587,
"eval_steps_per_second": 6.648,
"step": 65
},
{
"epoch": 20.92,
"eval_accuracy": 0.8666666666666667,
"eval_loss": 0.3301694691181183,
"eval_runtime": 0.3427,
"eval_samples_per_second": 131.308,
"eval_steps_per_second": 5.836,
"step": 68
},
{
"epoch": 21.54,
"learning_rate": 1.2345679012345678e-05,
"loss": 0.1944,
"step": 70
},
{
"epoch": 21.85,
"eval_accuracy": 0.8444444444444444,
"eval_loss": 0.32061001658439636,
"eval_runtime": 0.3167,
"eval_samples_per_second": 142.092,
"eval_steps_per_second": 6.315,
"step": 71
},
{
"epoch": 22.77,
"eval_accuracy": 0.8666666666666667,
"eval_loss": 0.3215346336364746,
"eval_runtime": 0.354,
"eval_samples_per_second": 127.118,
"eval_steps_per_second": 5.65,
"step": 74
},
{
"epoch": 24.0,
"eval_accuracy": 0.8666666666666667,
"eval_loss": 0.32090896368026733,
"eval_runtime": 0.3006,
"eval_samples_per_second": 149.688,
"eval_steps_per_second": 6.653,
"step": 78
},
{
"epoch": 24.62,
"learning_rate": 6.172839506172839e-06,
"loss": 0.2144,
"step": 80
},
{
"epoch": 24.92,
"eval_accuracy": 0.8444444444444444,
"eval_loss": 0.3326983153820038,
"eval_runtime": 0.2977,
"eval_samples_per_second": 151.157,
"eval_steps_per_second": 6.718,
"step": 81
},
{
"epoch": 25.85,
"eval_accuracy": 0.8444444444444444,
"eval_loss": 0.3506452441215515,
"eval_runtime": 0.3014,
"eval_samples_per_second": 149.324,
"eval_steps_per_second": 6.637,
"step": 84
},
{
"epoch": 26.77,
"eval_accuracy": 0.8444444444444444,
"eval_loss": 0.3544660210609436,
"eval_runtime": 0.3073,
"eval_samples_per_second": 146.433,
"eval_steps_per_second": 6.508,
"step": 87
},
{
"epoch": 27.69,
"learning_rate": 0.0,
"loss": 0.1754,
"step": 90
},
{
"epoch": 27.69,
"eval_accuracy": 0.8444444444444444,
"eval_loss": 0.34937629103660583,
"eval_runtime": 0.3537,
"eval_samples_per_second": 127.228,
"eval_steps_per_second": 5.655,
"step": 90
},
{
"epoch": 27.69,
"step": 90,
"total_flos": 2.789665591679447e+17,
"train_loss": 0.2528756472799513,
"train_runtime": 227.9034,
"train_samples_per_second": 53.312,
"train_steps_per_second": 0.395
}
],
"logging_steps": 10,
"max_steps": 90,
"num_train_epochs": 30,
"save_steps": 500,
"total_flos": 2.789665591679447e+17,
"trial_name": null,
"trial_params": null
}