faces_age_detection / checkpoint-13224 /trainer_state.json
dima806's picture
Upload folder using huggingface_hub
7cdaa37
{
"best_metric": 0.27537301182746887,
"best_model_checkpoint": "faces_age_detection/checkpoint-13224",
"epoch": 29.0,
"eval_steps": 500,
"global_step": 13224,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.8806292412091302,
"eval_loss": 0.3289386034011841,
"eval_runtime": 29.1731,
"eval_samples_per_second": 111.13,
"eval_steps_per_second": 3.496,
"step": 456
},
{
"epoch": 1.1,
"learning_rate": 1.9339691856199557e-06,
"loss": 0.3578,
"step": 500
},
{
"epoch": 2.0,
"eval_accuracy": 0.879086983343615,
"eval_loss": 0.3256358802318573,
"eval_runtime": 29.8484,
"eval_samples_per_second": 108.615,
"eval_steps_per_second": 3.417,
"step": 912
},
{
"epoch": 2.19,
"learning_rate": 1.8606016140865737e-06,
"loss": 0.2998,
"step": 1000
},
{
"epoch": 3.0,
"eval_accuracy": 0.8834053053670574,
"eval_loss": 0.3201422393321991,
"eval_runtime": 29.3669,
"eval_samples_per_second": 110.396,
"eval_steps_per_second": 3.473,
"step": 1368
},
{
"epoch": 3.29,
"learning_rate": 1.7872340425531913e-06,
"loss": 0.2666,
"step": 1500
},
{
"epoch": 4.0,
"eval_accuracy": 0.8867982726711906,
"eval_loss": 0.31441426277160645,
"eval_runtime": 29.5521,
"eval_samples_per_second": 109.705,
"eval_steps_per_second": 3.452,
"step": 1824
},
{
"epoch": 4.39,
"learning_rate": 1.7138664710198092e-06,
"loss": 0.2445,
"step": 2000
},
{
"epoch": 5.0,
"eval_accuracy": 0.8840222085132634,
"eval_loss": 0.31040704250335693,
"eval_runtime": 29.3243,
"eval_samples_per_second": 110.557,
"eval_steps_per_second": 3.478,
"step": 2280
},
{
"epoch": 5.48,
"learning_rate": 1.6404988994864268e-06,
"loss": 0.2307,
"step": 2500
},
{
"epoch": 6.0,
"eval_accuracy": 0.8756940160394818,
"eval_loss": 0.31916671991348267,
"eval_runtime": 29.1138,
"eval_samples_per_second": 111.356,
"eval_steps_per_second": 3.503,
"step": 2736
},
{
"epoch": 6.58,
"learning_rate": 1.5671313279530447e-06,
"loss": 0.2218,
"step": 3000
},
{
"epoch": 7.0,
"eval_accuracy": 0.8821714990746453,
"eval_loss": 0.30659398436546326,
"eval_runtime": 29.0887,
"eval_samples_per_second": 111.452,
"eval_steps_per_second": 3.507,
"step": 3192
},
{
"epoch": 7.68,
"learning_rate": 1.4937637564196623e-06,
"loss": 0.2007,
"step": 3500
},
{
"epoch": 8.0,
"eval_accuracy": 0.8793954349167181,
"eval_loss": 0.3129652738571167,
"eval_runtime": 28.3857,
"eval_samples_per_second": 114.212,
"eval_steps_per_second": 3.593,
"step": 3648
},
{
"epoch": 8.77,
"learning_rate": 1.4203961848862801e-06,
"loss": 0.192,
"step": 4000
},
{
"epoch": 9.0,
"eval_accuracy": 0.8809376927822332,
"eval_loss": 0.31223684549331665,
"eval_runtime": 28.6423,
"eval_samples_per_second": 113.189,
"eval_steps_per_second": 3.561,
"step": 4104
},
{
"epoch": 9.87,
"learning_rate": 1.3470286133528978e-06,
"loss": 0.1832,
"step": 4500
},
{
"epoch": 10.0,
"eval_accuracy": 0.8883405305367057,
"eval_loss": 0.29440754652023315,
"eval_runtime": 29.0492,
"eval_samples_per_second": 111.604,
"eval_steps_per_second": 3.511,
"step": 4560
},
{
"epoch": 10.96,
"learning_rate": 1.2736610418195158e-06,
"loss": 0.1743,
"step": 5000
},
{
"epoch": 11.0,
"eval_accuracy": 0.8815545959284392,
"eval_loss": 0.3053087294101715,
"eval_runtime": 29.3331,
"eval_samples_per_second": 110.523,
"eval_steps_per_second": 3.477,
"step": 5016
},
{
"epoch": 12.0,
"eval_accuracy": 0.8858729179518815,
"eval_loss": 0.2922166883945465,
"eval_runtime": 29.148,
"eval_samples_per_second": 111.225,
"eval_steps_per_second": 3.499,
"step": 5472
},
{
"epoch": 12.06,
"learning_rate": 1.2002934702861334e-06,
"loss": 0.1668,
"step": 5500
},
{
"epoch": 13.0,
"eval_accuracy": 0.8815545959284392,
"eval_loss": 0.3020872473716736,
"eval_runtime": 29.262,
"eval_samples_per_second": 110.792,
"eval_steps_per_second": 3.486,
"step": 5928
},
{
"epoch": 13.16,
"learning_rate": 1.1269258987527513e-06,
"loss": 0.1608,
"step": 6000
},
{
"epoch": 14.0,
"eval_accuracy": 0.8830968537939543,
"eval_loss": 0.3037404716014862,
"eval_runtime": 29.0749,
"eval_samples_per_second": 111.505,
"eval_steps_per_second": 3.508,
"step": 6384
},
{
"epoch": 14.25,
"learning_rate": 1.053558327219369e-06,
"loss": 0.1563,
"step": 6500
},
{
"epoch": 15.0,
"eval_accuracy": 0.8843306600863664,
"eval_loss": 0.29694926738739014,
"eval_runtime": 29.4263,
"eval_samples_per_second": 110.173,
"eval_steps_per_second": 3.466,
"step": 6840
},
{
"epoch": 15.35,
"learning_rate": 9.801907556859868e-07,
"loss": 0.1467,
"step": 7000
},
{
"epoch": 16.0,
"eval_accuracy": 0.8877236273904997,
"eval_loss": 0.29596608877182007,
"eval_runtime": 29.2838,
"eval_samples_per_second": 110.71,
"eval_steps_per_second": 3.483,
"step": 7296
},
{
"epoch": 16.45,
"learning_rate": 9.068231841526045e-07,
"loss": 0.139,
"step": 7500
},
{
"epoch": 17.0,
"eval_accuracy": 0.8864898210980876,
"eval_loss": 0.2912845313549042,
"eval_runtime": 29.0512,
"eval_samples_per_second": 111.596,
"eval_steps_per_second": 3.511,
"step": 7752
},
{
"epoch": 17.54,
"learning_rate": 8.334556126192222e-07,
"loss": 0.1363,
"step": 8000
},
{
"epoch": 18.0,
"eval_accuracy": 0.891425046267736,
"eval_loss": 0.2851228415966034,
"eval_runtime": 29.8791,
"eval_samples_per_second": 108.504,
"eval_steps_per_second": 3.414,
"step": 8208
},
{
"epoch": 18.64,
"learning_rate": 7.6008804108584e-07,
"loss": 0.1283,
"step": 8500
},
{
"epoch": 19.0,
"eval_accuracy": 0.892350400987045,
"eval_loss": 0.28452929854393005,
"eval_runtime": 29.4229,
"eval_samples_per_second": 110.186,
"eval_steps_per_second": 3.467,
"step": 8664
},
{
"epoch": 19.74,
"learning_rate": 6.867204695524578e-07,
"loss": 0.1302,
"step": 9000
},
{
"epoch": 20.0,
"eval_accuracy": 0.8901912399753239,
"eval_loss": 0.28534042835235596,
"eval_runtime": 29.1008,
"eval_samples_per_second": 111.406,
"eval_steps_per_second": 3.505,
"step": 9120
},
{
"epoch": 20.83,
"learning_rate": 6.133528980190756e-07,
"loss": 0.1269,
"step": 9500
},
{
"epoch": 21.0,
"eval_accuracy": 0.892041949413942,
"eval_loss": 0.28531745076179504,
"eval_runtime": 28.8168,
"eval_samples_per_second": 112.504,
"eval_steps_per_second": 3.54,
"step": 9576
},
{
"epoch": 21.93,
"learning_rate": 5.399853264856933e-07,
"loss": 0.1211,
"step": 10000
},
{
"epoch": 22.0,
"eval_accuracy": 0.892041949413942,
"eval_loss": 0.2809159457683563,
"eval_runtime": 28.7701,
"eval_samples_per_second": 112.686,
"eval_steps_per_second": 3.545,
"step": 10032
},
{
"epoch": 23.0,
"eval_accuracy": 0.8892658852560148,
"eval_loss": 0.28494611382484436,
"eval_runtime": 28.5362,
"eval_samples_per_second": 113.61,
"eval_steps_per_second": 3.574,
"step": 10488
},
{
"epoch": 23.03,
"learning_rate": 4.6661775495231103e-07,
"loss": 0.1199,
"step": 10500
},
{
"epoch": 24.0,
"eval_accuracy": 0.8942011104256632,
"eval_loss": 0.2793309986591339,
"eval_runtime": 28.7961,
"eval_samples_per_second": 112.585,
"eval_steps_per_second": 3.542,
"step": 10944
},
{
"epoch": 24.12,
"learning_rate": 3.932501834189288e-07,
"loss": 0.1197,
"step": 11000
},
{
"epoch": 25.0,
"eval_accuracy": 0.8948180135718692,
"eval_loss": 0.2778417766094208,
"eval_runtime": 27.4503,
"eval_samples_per_second": 118.105,
"eval_steps_per_second": 3.716,
"step": 11400
},
{
"epoch": 25.22,
"learning_rate": 3.1988261188554655e-07,
"loss": 0.1163,
"step": 11500
},
{
"epoch": 26.0,
"eval_accuracy": 0.8960518198642813,
"eval_loss": 0.27623382210731506,
"eval_runtime": 27.6199,
"eval_samples_per_second": 117.379,
"eval_steps_per_second": 3.693,
"step": 11856
},
{
"epoch": 26.32,
"learning_rate": 2.4651504035216434e-07,
"loss": 0.1152,
"step": 12000
},
{
"epoch": 27.0,
"eval_accuracy": 0.8963602714373843,
"eval_loss": 0.2759145498275757,
"eval_runtime": 29.0519,
"eval_samples_per_second": 111.594,
"eval_steps_per_second": 3.511,
"step": 12312
},
{
"epoch": 27.41,
"learning_rate": 1.7314746881878208e-07,
"loss": 0.1105,
"step": 12500
},
{
"epoch": 28.0,
"eval_accuracy": 0.8969771745835904,
"eval_loss": 0.27611085772514343,
"eval_runtime": 27.509,
"eval_samples_per_second": 117.852,
"eval_steps_per_second": 3.708,
"step": 12768
},
{
"epoch": 28.51,
"learning_rate": 9.977989728539984e-08,
"loss": 0.11,
"step": 13000
},
{
"epoch": 29.0,
"eval_accuracy": 0.8969771745835904,
"eval_loss": 0.27537301182746887,
"eval_runtime": 28.0691,
"eval_samples_per_second": 115.501,
"eval_steps_per_second": 3.634,
"step": 13224
}
],
"logging_steps": 500,
"max_steps": 13680,
"num_input_tokens_seen": 0,
"num_train_epochs": 30,
"save_steps": 500,
"total_flos": 6.555338630367276e+19,
"train_batch_size": 64,
"trial_name": null,
"trial_params": null
}