| { | |
| "best_metric": 0.8090909090909091, | |
| "best_model_checkpoint": "swinv2-tiny-patch4-window8-256-Diabetic-Retinopathy\\checkpoint-110", | |
| "epoch": 40.0, | |
| "eval_steps": 500, | |
| "global_step": 200, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "eval_accuracy": 0.4909090909090909, | |
| "eval_loss": 1.6053773164749146, | |
| "eval_runtime": 1.1664, | |
| "eval_samples_per_second": 94.304, | |
| "eval_steps_per_second": 3.429, | |
| "step": 5 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "learning_rate": 2.5e-05, | |
| "loss": 1.6039, | |
| "step": 10 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_accuracy": 0.4909090909090909, | |
| "eval_loss": 1.577444314956665, | |
| "eval_runtime": 0.6246, | |
| "eval_samples_per_second": 176.117, | |
| "eval_steps_per_second": 6.404, | |
| "step": 10 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accuracy": 0.4909090909090909, | |
| "eval_loss": 1.4627095460891724, | |
| "eval_runtime": 0.6237, | |
| "eval_samples_per_second": 176.372, | |
| "eval_steps_per_second": 6.414, | |
| "step": 15 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "learning_rate": 5e-05, | |
| "loss": 1.4766, | |
| "step": 20 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_accuracy": 0.4909090909090909, | |
| "eval_loss": 1.3211016654968262, | |
| "eval_runtime": 0.5963, | |
| "eval_samples_per_second": 184.459, | |
| "eval_steps_per_second": 6.708, | |
| "step": 20 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_accuracy": 0.4909090909090909, | |
| "eval_loss": 1.2294203042984009, | |
| "eval_runtime": 0.6045, | |
| "eval_samples_per_second": 181.978, | |
| "eval_steps_per_second": 6.617, | |
| "step": 25 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "learning_rate": 4.722222222222222e-05, | |
| "loss": 1.2308, | |
| "step": 30 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_accuracy": 0.4909090909090909, | |
| "eval_loss": 1.0656994581222534, | |
| "eval_runtime": 0.6274, | |
| "eval_samples_per_second": 175.336, | |
| "eval_steps_per_second": 6.376, | |
| "step": 30 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_accuracy": 0.6545454545454545, | |
| "eval_loss": 0.9504080414772034, | |
| "eval_runtime": 0.6116, | |
| "eval_samples_per_second": 179.842, | |
| "eval_steps_per_second": 6.54, | |
| "step": 35 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "learning_rate": 4.4444444444444447e-05, | |
| "loss": 1.017, | |
| "step": 40 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_accuracy": 0.7363636363636363, | |
| "eval_loss": 0.8463379740715027, | |
| "eval_runtime": 0.6133, | |
| "eval_samples_per_second": 179.362, | |
| "eval_steps_per_second": 6.522, | |
| "step": 40 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_accuracy": 0.7454545454545455, | |
| "eval_loss": 0.7462926506996155, | |
| "eval_runtime": 0.6373, | |
| "eval_samples_per_second": 172.596, | |
| "eval_steps_per_second": 6.276, | |
| "step": 45 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "learning_rate": 4.166666666666667e-05, | |
| "loss": 0.8345, | |
| "step": 50 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_accuracy": 0.7454545454545455, | |
| "eval_loss": 0.6947882771492004, | |
| "eval_runtime": 0.6097, | |
| "eval_samples_per_second": 180.42, | |
| "eval_steps_per_second": 6.561, | |
| "step": 50 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "eval_accuracy": 0.7545454545454545, | |
| "eval_loss": 0.6460423469543457, | |
| "eval_runtime": 0.6052, | |
| "eval_samples_per_second": 181.744, | |
| "eval_steps_per_second": 6.609, | |
| "step": 55 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "learning_rate": 3.888888888888889e-05, | |
| "loss": 0.7594, | |
| "step": 60 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "eval_accuracy": 0.7545454545454545, | |
| "eval_loss": 0.6403194069862366, | |
| "eval_runtime": 0.6016, | |
| "eval_samples_per_second": 182.831, | |
| "eval_steps_per_second": 6.648, | |
| "step": 60 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "eval_accuracy": 0.7545454545454545, | |
| "eval_loss": 0.631945788860321, | |
| "eval_runtime": 0.6046, | |
| "eval_samples_per_second": 181.926, | |
| "eval_steps_per_second": 6.615, | |
| "step": 65 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "learning_rate": 3.611111111111111e-05, | |
| "loss": 0.7228, | |
| "step": 70 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "eval_accuracy": 0.7454545454545455, | |
| "eval_loss": 0.5999094843864441, | |
| "eval_runtime": 0.6056, | |
| "eval_samples_per_second": 181.624, | |
| "eval_steps_per_second": 6.605, | |
| "step": 70 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "eval_accuracy": 0.7545454545454545, | |
| "eval_loss": 0.5922093391418457, | |
| "eval_runtime": 0.5972, | |
| "eval_samples_per_second": 184.202, | |
| "eval_steps_per_second": 6.698, | |
| "step": 75 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "learning_rate": 3.3333333333333335e-05, | |
| "loss": 0.6851, | |
| "step": 80 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "eval_accuracy": 0.7636363636363637, | |
| "eval_loss": 0.5955119132995605, | |
| "eval_runtime": 0.6011, | |
| "eval_samples_per_second": 182.985, | |
| "eval_steps_per_second": 6.654, | |
| "step": 80 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "eval_accuracy": 0.7545454545454545, | |
| "eval_loss": 0.573071300983429, | |
| "eval_runtime": 0.6051, | |
| "eval_samples_per_second": 181.777, | |
| "eval_steps_per_second": 6.61, | |
| "step": 85 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "learning_rate": 3.055555555555556e-05, | |
| "loss": 0.6549, | |
| "step": 90 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "eval_accuracy": 0.7818181818181819, | |
| "eval_loss": 0.5602535605430603, | |
| "eval_runtime": 0.7062, | |
| "eval_samples_per_second": 155.768, | |
| "eval_steps_per_second": 5.664, | |
| "step": 90 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "eval_accuracy": 0.7818181818181819, | |
| "eval_loss": 0.5386339426040649, | |
| "eval_runtime": 0.6221, | |
| "eval_samples_per_second": 176.809, | |
| "eval_steps_per_second": 6.429, | |
| "step": 95 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "learning_rate": 2.777777777777778e-05, | |
| "loss": 0.643, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "eval_accuracy": 0.7727272727272727, | |
| "eval_loss": 0.5423626899719238, | |
| "eval_runtime": 0.6072, | |
| "eval_samples_per_second": 181.171, | |
| "eval_steps_per_second": 6.588, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 21.0, | |
| "eval_accuracy": 0.7909090909090909, | |
| "eval_loss": 0.5295349955558777, | |
| "eval_runtime": 0.6772, | |
| "eval_samples_per_second": 162.427, | |
| "eval_steps_per_second": 5.906, | |
| "step": 105 | |
| }, | |
| { | |
| "epoch": 22.0, | |
| "learning_rate": 2.5e-05, | |
| "loss": 0.5951, | |
| "step": 110 | |
| }, | |
| { | |
| "epoch": 22.0, | |
| "eval_accuracy": 0.8090909090909091, | |
| "eval_loss": 0.5203222036361694, | |
| "eval_runtime": 0.6067, | |
| "eval_samples_per_second": 181.322, | |
| "eval_steps_per_second": 6.594, | |
| "step": 110 | |
| }, | |
| { | |
| "epoch": 23.0, | |
| "eval_accuracy": 0.7909090909090909, | |
| "eval_loss": 0.516213059425354, | |
| "eval_runtime": 0.6272, | |
| "eval_samples_per_second": 175.393, | |
| "eval_steps_per_second": 6.378, | |
| "step": 115 | |
| }, | |
| { | |
| "epoch": 24.0, | |
| "learning_rate": 2.2222222222222223e-05, | |
| "loss": 0.5913, | |
| "step": 120 | |
| }, | |
| { | |
| "epoch": 24.0, | |
| "eval_accuracy": 0.7818181818181819, | |
| "eval_loss": 0.5094789862632751, | |
| "eval_runtime": 0.6677, | |
| "eval_samples_per_second": 164.747, | |
| "eval_steps_per_second": 5.991, | |
| "step": 120 | |
| }, | |
| { | |
| "epoch": 25.0, | |
| "eval_accuracy": 0.7909090909090909, | |
| "eval_loss": 0.5140318870544434, | |
| "eval_runtime": 0.6572, | |
| "eval_samples_per_second": 167.374, | |
| "eval_steps_per_second": 6.086, | |
| "step": 125 | |
| }, | |
| { | |
| "epoch": 26.0, | |
| "learning_rate": 1.9444444444444445e-05, | |
| "loss": 0.5462, | |
| "step": 130 | |
| }, | |
| { | |
| "epoch": 26.0, | |
| "eval_accuracy": 0.7636363636363637, | |
| "eval_loss": 0.5167139768600464, | |
| "eval_runtime": 0.7442, | |
| "eval_samples_per_second": 147.801, | |
| "eval_steps_per_second": 5.375, | |
| "step": 130 | |
| }, | |
| { | |
| "epoch": 27.0, | |
| "eval_accuracy": 0.7909090909090909, | |
| "eval_loss": 0.49426034092903137, | |
| "eval_runtime": 0.6102, | |
| "eval_samples_per_second": 180.278, | |
| "eval_steps_per_second": 6.556, | |
| "step": 135 | |
| }, | |
| { | |
| "epoch": 28.0, | |
| "learning_rate": 1.6666666666666667e-05, | |
| "loss": 0.5538, | |
| "step": 140 | |
| }, | |
| { | |
| "epoch": 28.0, | |
| "eval_accuracy": 0.7636363636363637, | |
| "eval_loss": 0.4843919575214386, | |
| "eval_runtime": 0.7542, | |
| "eval_samples_per_second": 145.854, | |
| "eval_steps_per_second": 5.304, | |
| "step": 140 | |
| }, | |
| { | |
| "epoch": 29.0, | |
| "eval_accuracy": 0.7727272727272727, | |
| "eval_loss": 0.4821490943431854, | |
| "eval_runtime": 0.6238, | |
| "eval_samples_per_second": 176.347, | |
| "eval_steps_per_second": 6.413, | |
| "step": 145 | |
| }, | |
| { | |
| "epoch": 30.0, | |
| "learning_rate": 1.388888888888889e-05, | |
| "loss": 0.5497, | |
| "step": 150 | |
| }, | |
| { | |
| "epoch": 30.0, | |
| "eval_accuracy": 0.7727272727272727, | |
| "eval_loss": 0.49517491459846497, | |
| "eval_runtime": 0.6867, | |
| "eval_samples_per_second": 160.188, | |
| "eval_steps_per_second": 5.825, | |
| "step": 150 | |
| }, | |
| { | |
| "epoch": 31.0, | |
| "eval_accuracy": 0.7818181818181819, | |
| "eval_loss": 0.499459445476532, | |
| "eval_runtime": 0.6542, | |
| "eval_samples_per_second": 168.144, | |
| "eval_steps_per_second": 6.114, | |
| "step": 155 | |
| }, | |
| { | |
| "epoch": 32.0, | |
| "learning_rate": 1.1111111111111112e-05, | |
| "loss": 0.4923, | |
| "step": 160 | |
| }, | |
| { | |
| "epoch": 32.0, | |
| "eval_accuracy": 0.7727272727272727, | |
| "eval_loss": 0.4910464286804199, | |
| "eval_runtime": 0.6079, | |
| "eval_samples_per_second": 180.941, | |
| "eval_steps_per_second": 6.58, | |
| "step": 160 | |
| }, | |
| { | |
| "epoch": 33.0, | |
| "eval_accuracy": 0.7818181818181819, | |
| "eval_loss": 0.5028622150421143, | |
| "eval_runtime": 0.6106, | |
| "eval_samples_per_second": 180.138, | |
| "eval_steps_per_second": 6.55, | |
| "step": 165 | |
| }, | |
| { | |
| "epoch": 34.0, | |
| "learning_rate": 8.333333333333334e-06, | |
| "loss": 0.5228, | |
| "step": 170 | |
| }, | |
| { | |
| "epoch": 34.0, | |
| "eval_accuracy": 0.7818181818181819, | |
| "eval_loss": 0.5083434581756592, | |
| "eval_runtime": 0.6097, | |
| "eval_samples_per_second": 180.422, | |
| "eval_steps_per_second": 6.561, | |
| "step": 170 | |
| }, | |
| { | |
| "epoch": 35.0, | |
| "eval_accuracy": 0.7909090909090909, | |
| "eval_loss": 0.49842116236686707, | |
| "eval_runtime": 0.6153, | |
| "eval_samples_per_second": 178.786, | |
| "eval_steps_per_second": 6.501, | |
| "step": 175 | |
| }, | |
| { | |
| "epoch": 36.0, | |
| "learning_rate": 5.555555555555556e-06, | |
| "loss": 0.4986, | |
| "step": 180 | |
| }, | |
| { | |
| "epoch": 36.0, | |
| "eval_accuracy": 0.7909090909090909, | |
| "eval_loss": 0.4914481043815613, | |
| "eval_runtime": 0.6407, | |
| "eval_samples_per_second": 171.693, | |
| "eval_steps_per_second": 6.243, | |
| "step": 180 | |
| }, | |
| { | |
| "epoch": 37.0, | |
| "eval_accuracy": 0.7909090909090909, | |
| "eval_loss": 0.4926435649394989, | |
| "eval_runtime": 0.6131, | |
| "eval_samples_per_second": 179.402, | |
| "eval_steps_per_second": 6.524, | |
| "step": 185 | |
| }, | |
| { | |
| "epoch": 38.0, | |
| "learning_rate": 2.777777777777778e-06, | |
| "loss": 0.5154, | |
| "step": 190 | |
| }, | |
| { | |
| "epoch": 38.0, | |
| "eval_accuracy": 0.8, | |
| "eval_loss": 0.49148377776145935, | |
| "eval_runtime": 0.6154, | |
| "eval_samples_per_second": 178.737, | |
| "eval_steps_per_second": 6.5, | |
| "step": 190 | |
| }, | |
| { | |
| "epoch": 39.0, | |
| "eval_accuracy": 0.8, | |
| "eval_loss": 0.4885866641998291, | |
| "eval_runtime": 0.636, | |
| "eval_samples_per_second": 172.961, | |
| "eval_steps_per_second": 6.289, | |
| "step": 195 | |
| }, | |
| { | |
| "epoch": 40.0, | |
| "learning_rate": 0.0, | |
| "loss": 0.5081, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 40.0, | |
| "eval_accuracy": 0.8, | |
| "eval_loss": 0.48748189210891724, | |
| "eval_runtime": 0.5972, | |
| "eval_samples_per_second": 184.204, | |
| "eval_steps_per_second": 6.698, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 40.0, | |
| "step": 200, | |
| "total_flos": 8.108232849122918e+17, | |
| "train_loss": 0.750064127445221, | |
| "train_runtime": 356.9379, | |
| "train_samples_per_second": 69.816, | |
| "train_steps_per_second": 0.56 | |
| } | |
| ], | |
| "logging_steps": 10, | |
| "max_steps": 200, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 40, | |
| "save_steps": 500, | |
| "total_flos": 8.108232849122918e+17, | |
| "train_batch_size": 32, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |