| { | |
| "best_metric": 0.24626319110393524, | |
| "best_model_checkpoint": "faces_age_detection/checkpoint-4864", | |
| "epoch": 16.0, | |
| "eval_steps": 500, | |
| "global_step": 4864, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "eval_accuracy": 0.9048206710374084, | |
| "eval_loss": 0.25544658303260803, | |
| "eval_model_preparation_time": 0.0056, | |
| "eval_runtime": 115.8575, | |
| "eval_samples_per_second": 111.905, | |
| "eval_steps_per_second": 3.504, | |
| "step": 304 | |
| }, | |
| { | |
| "epoch": 1.6447368421052633, | |
| "grad_norm": 9.665897369384766, | |
| "learning_rate": 9.253731343283582e-07, | |
| "loss": 0.1128, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_accuracy": 0.9051291939838025, | |
| "eval_loss": 0.25322863459587097, | |
| "eval_model_preparation_time": 0.0056, | |
| "eval_runtime": 116.0042, | |
| "eval_samples_per_second": 111.763, | |
| "eval_steps_per_second": 3.5, | |
| "step": 608 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accuracy": 0.909371384496722, | |
| "eval_loss": 0.24770796298980713, | |
| "eval_model_preparation_time": 0.0056, | |
| "eval_runtime": 115.4652, | |
| "eval_samples_per_second": 112.285, | |
| "eval_steps_per_second": 3.516, | |
| "step": 912 | |
| }, | |
| { | |
| "epoch": 3.2894736842105265, | |
| "grad_norm": 5.963768482208252, | |
| "learning_rate": 8.424543946932007e-07, | |
| "loss": 0.1092, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_accuracy": 0.9075973775549556, | |
| "eval_loss": 0.2508331835269928, | |
| "eval_model_preparation_time": 0.0056, | |
| "eval_runtime": 110.7185, | |
| "eval_samples_per_second": 117.099, | |
| "eval_steps_per_second": 3.667, | |
| "step": 1216 | |
| }, | |
| { | |
| "epoch": 4.934210526315789, | |
| "grad_norm": 6.369262218475342, | |
| "learning_rate": 7.595356550580431e-07, | |
| "loss": 0.1013, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_accuracy": 0.9069803316621674, | |
| "eval_loss": 0.24949955940246582, | |
| "eval_model_preparation_time": 0.0056, | |
| "eval_runtime": 114.7896, | |
| "eval_samples_per_second": 112.946, | |
| "eval_steps_per_second": 3.537, | |
| "step": 1520 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_accuracy": 0.9052834554569996, | |
| "eval_loss": 0.2557480037212372, | |
| "eval_model_preparation_time": 0.0056, | |
| "eval_runtime": 117.3931, | |
| "eval_samples_per_second": 110.441, | |
| "eval_steps_per_second": 3.458, | |
| "step": 1824 | |
| }, | |
| { | |
| "epoch": 6.578947368421053, | |
| "grad_norm": 8.901986122131348, | |
| "learning_rate": 6.766169154228856e-07, | |
| "loss": 0.097, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_accuracy": 0.9085229463941381, | |
| "eval_loss": 0.2521224617958069, | |
| "eval_model_preparation_time": 0.0056, | |
| "eval_runtime": 116.8685, | |
| "eval_samples_per_second": 110.937, | |
| "eval_steps_per_second": 3.474, | |
| "step": 2128 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_accuracy": 0.9035865792518318, | |
| "eval_loss": 0.2614166736602783, | |
| "eval_model_preparation_time": 0.0056, | |
| "eval_runtime": 117.7658, | |
| "eval_samples_per_second": 110.091, | |
| "eval_steps_per_second": 3.448, | |
| "step": 2432 | |
| }, | |
| { | |
| "epoch": 8.223684210526315, | |
| "grad_norm": 9.241392135620117, | |
| "learning_rate": 5.93698175787728e-07, | |
| "loss": 0.0981, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_accuracy": 0.9066718087157732, | |
| "eval_loss": 0.25424298644065857, | |
| "eval_model_preparation_time": 0.0056, | |
| "eval_runtime": 117.1049, | |
| "eval_samples_per_second": 110.713, | |
| "eval_steps_per_second": 3.467, | |
| "step": 2736 | |
| }, | |
| { | |
| "epoch": 9.868421052631579, | |
| "grad_norm": 15.468152046203613, | |
| "learning_rate": 5.107794361525704e-07, | |
| "loss": 0.0928, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_accuracy": 0.9087543386039336, | |
| "eval_loss": 0.2496512234210968, | |
| "eval_model_preparation_time": 0.0056, | |
| "eval_runtime": 117.518, | |
| "eval_samples_per_second": 110.324, | |
| "eval_steps_per_second": 3.455, | |
| "step": 3040 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "eval_accuracy": 0.9098341689163132, | |
| "eval_loss": 0.2480880618095398, | |
| "eval_model_preparation_time": 0.0056, | |
| "eval_runtime": 119.13, | |
| "eval_samples_per_second": 108.831, | |
| "eval_steps_per_second": 3.408, | |
| "step": 3344 | |
| }, | |
| { | |
| "epoch": 11.513157894736842, | |
| "grad_norm": 9.02236557006836, | |
| "learning_rate": 4.278606965174129e-07, | |
| "loss": 0.088, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "eval_accuracy": 0.9090628615503278, | |
| "eval_loss": 0.2512376010417938, | |
| "eval_model_preparation_time": 0.0056, | |
| "eval_runtime": 117.373, | |
| "eval_samples_per_second": 110.46, | |
| "eval_steps_per_second": 3.459, | |
| "step": 3648 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "eval_accuracy": 0.9090628615503278, | |
| "eval_loss": 0.2498735636472702, | |
| "eval_model_preparation_time": 0.0056, | |
| "eval_runtime": 116.0104, | |
| "eval_samples_per_second": 111.757, | |
| "eval_steps_per_second": 3.5, | |
| "step": 3952 | |
| }, | |
| { | |
| "epoch": 13.157894736842104, | |
| "grad_norm": 10.029730796813965, | |
| "learning_rate": 3.4494195688225535e-07, | |
| "loss": 0.0855, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "eval_accuracy": 0.9099112996529117, | |
| "eval_loss": 0.24805885553359985, | |
| "eval_model_preparation_time": 0.0056, | |
| "eval_runtime": 116.2889, | |
| "eval_samples_per_second": 111.49, | |
| "eval_steps_per_second": 3.491, | |
| "step": 4256 | |
| }, | |
| { | |
| "epoch": 14.802631578947368, | |
| "grad_norm": 7.256553649902344, | |
| "learning_rate": 2.620232172470978e-07, | |
| "loss": 0.0847, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "eval_accuracy": 0.9097570381797146, | |
| "eval_loss": 0.24851545691490173, | |
| "eval_model_preparation_time": 0.0056, | |
| "eval_runtime": 115.2188, | |
| "eval_samples_per_second": 112.525, | |
| "eval_steps_per_second": 3.524, | |
| "step": 4560 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "eval_accuracy": 0.9106054762822985, | |
| "eval_loss": 0.24626319110393524, | |
| "eval_model_preparation_time": 0.0056, | |
| "eval_runtime": 114.9847, | |
| "eval_samples_per_second": 112.754, | |
| "eval_steps_per_second": 3.531, | |
| "step": 4864 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 6080, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 20, | |
| "save_steps": 500, | |
| "stateful_callbacks": { | |
| "TrainerControl": { | |
| "args": { | |
| "should_epoch_stop": false, | |
| "should_evaluate": false, | |
| "should_log": false, | |
| "should_save": true, | |
| "should_training_stop": false | |
| }, | |
| "attributes": {} | |
| } | |
| }, | |
| "total_flos": 2.4112003658884735e+19, | |
| "train_batch_size": 64, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |