SodaXII's picture
Training in progress, epoch 12
ef3461b verified
{
"best_metric": 0.7892076373100281,
"best_model_checkpoint": "./drive/Shareddrives/CS198-Drones/training_output/deit-base-patch16-224_rice-leaf-disease-augmented_tl_020125/checkpoint-2750",
"epoch": 11.0,
"eval_steps": 500,
"global_step": 2750,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 1.9162791967391968,
"learning_rate": 6.666666666666667e-05,
"loss": 2.0085,
"step": 250
},
{
"epoch": 1.0,
"eval_accuracy": 0.4305,
"eval_loss": 1.792047381401062,
"eval_runtime": 84.9032,
"eval_samples_per_second": 23.556,
"eval_steps_per_second": 0.377,
"step": 250
},
{
"epoch": 2.0,
"grad_norm": 2.125405788421631,
"learning_rate": 9.62962962962963e-05,
"loss": 1.5371,
"step": 500
},
{
"epoch": 2.0,
"eval_accuracy": 0.5935,
"eval_loss": 1.3466979265213013,
"eval_runtime": 82.4206,
"eval_samples_per_second": 24.266,
"eval_steps_per_second": 0.388,
"step": 500
},
{
"epoch": 3.0,
"grad_norm": 1.350229263305664,
"learning_rate": 8.888888888888889e-05,
"loss": 1.2212,
"step": 750
},
{
"epoch": 3.0,
"eval_accuracy": 0.658,
"eval_loss": 1.1434305906295776,
"eval_runtime": 82.3983,
"eval_samples_per_second": 24.272,
"eval_steps_per_second": 0.388,
"step": 750
},
{
"epoch": 4.0,
"grad_norm": 1.5317795276641846,
"learning_rate": 8.148148148148148e-05,
"loss": 1.0695,
"step": 1000
},
{
"epoch": 4.0,
"eval_accuracy": 0.6845,
"eval_loss": 1.032365083694458,
"eval_runtime": 83.1096,
"eval_samples_per_second": 24.065,
"eval_steps_per_second": 0.385,
"step": 1000
},
{
"epoch": 5.0,
"grad_norm": 1.244685411453247,
"learning_rate": 7.407407407407407e-05,
"loss": 0.9787,
"step": 1250
},
{
"epoch": 5.0,
"eval_accuracy": 0.707,
"eval_loss": 0.9591642022132874,
"eval_runtime": 82.6395,
"eval_samples_per_second": 24.201,
"eval_steps_per_second": 0.387,
"step": 1250
},
{
"epoch": 6.0,
"grad_norm": 1.4709614515304565,
"learning_rate": 6.666666666666667e-05,
"loss": 0.916,
"step": 1500
},
{
"epoch": 6.0,
"eval_accuracy": 0.7175,
"eval_loss": 0.9066343903541565,
"eval_runtime": 82.3354,
"eval_samples_per_second": 24.291,
"eval_steps_per_second": 0.389,
"step": 1500
},
{
"epoch": 7.0,
"grad_norm": 1.2172740697860718,
"learning_rate": 5.925925925925926e-05,
"loss": 0.8713,
"step": 1750
},
{
"epoch": 7.0,
"eval_accuracy": 0.7255,
"eval_loss": 0.8704714179039001,
"eval_runtime": 81.2079,
"eval_samples_per_second": 24.628,
"eval_steps_per_second": 0.394,
"step": 1750
},
{
"epoch": 8.0,
"grad_norm": 1.2027114629745483,
"learning_rate": 5.185185185185185e-05,
"loss": 0.8382,
"step": 2000
},
{
"epoch": 8.0,
"eval_accuracy": 0.736,
"eval_loss": 0.8404390811920166,
"eval_runtime": 82.8948,
"eval_samples_per_second": 24.127,
"eval_steps_per_second": 0.386,
"step": 2000
},
{
"epoch": 9.0,
"grad_norm": 1.447483777999878,
"learning_rate": 4.4444444444444447e-05,
"loss": 0.8123,
"step": 2250
},
{
"epoch": 9.0,
"eval_accuracy": 0.7405,
"eval_loss": 0.8189741373062134,
"eval_runtime": 80.1471,
"eval_samples_per_second": 24.954,
"eval_steps_per_second": 0.399,
"step": 2250
},
{
"epoch": 10.0,
"grad_norm": 1.2021894454956055,
"learning_rate": 3.7037037037037037e-05,
"loss": 0.7927,
"step": 2500
},
{
"epoch": 10.0,
"eval_accuracy": 0.746,
"eval_loss": 0.8022432923316956,
"eval_runtime": 80.7389,
"eval_samples_per_second": 24.771,
"eval_steps_per_second": 0.396,
"step": 2500
},
{
"epoch": 11.0,
"grad_norm": 0.9182590246200562,
"learning_rate": 2.962962962962963e-05,
"loss": 0.7772,
"step": 2750
},
{
"epoch": 11.0,
"eval_accuracy": 0.753,
"eval_loss": 0.7892076373100281,
"eval_runtime": 81.7439,
"eval_samples_per_second": 24.467,
"eval_steps_per_second": 0.391,
"step": 2750
}
],
"logging_steps": 500,
"max_steps": 3750,
"num_input_tokens_seen": 0,
"num_train_epochs": 15,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 1.3639323602386944e+19,
"train_batch_size": 64,
"trial_name": null,
"trial_params": null
}