{ "best_metric": 0.8431372549019608, "best_model_checkpoint": "vit-base-patch16-224-RU9-24\\checkpoint-152", "epoch": 24.0, "eval_steps": 500, "global_step": 192, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.5098039215686274, "eval_loss": 1.340147614479065, "eval_runtime": 1.0273, "eval_samples_per_second": 49.646, "eval_steps_per_second": 1.947, "step": 8 }, { "epoch": 1.25, "learning_rate": 5.5e-05, "loss": 1.3685, "step": 10 }, { "epoch": 2.0, "eval_accuracy": 0.5686274509803921, "eval_loss": 1.219266653060913, "eval_runtime": 0.799, "eval_samples_per_second": 63.826, "eval_steps_per_second": 2.503, "step": 16 }, { "epoch": 2.5, "learning_rate": 5.197802197802198e-05, "loss": 1.2413, "step": 20 }, { "epoch": 3.0, "eval_accuracy": 0.5882352941176471, "eval_loss": 1.1150447130203247, "eval_runtime": 0.7843, "eval_samples_per_second": 65.03, "eval_steps_per_second": 2.55, "step": 24 }, { "epoch": 3.75, "learning_rate": 4.8956043956043954e-05, "loss": 1.1126, "step": 30 }, { "epoch": 4.0, "eval_accuracy": 0.7058823529411765, "eval_loss": 0.995692253112793, "eval_runtime": 0.8045, "eval_samples_per_second": 63.394, "eval_steps_per_second": 2.486, "step": 32 }, { "epoch": 5.0, "learning_rate": 4.593406593406594e-05, "loss": 0.9285, "step": 40 }, { "epoch": 5.0, "eval_accuracy": 0.6862745098039216, "eval_loss": 0.897616982460022, "eval_runtime": 0.7886, "eval_samples_per_second": 64.671, "eval_steps_per_second": 2.536, "step": 40 }, { "epoch": 6.0, "eval_accuracy": 0.6862745098039216, "eval_loss": 0.8579562306404114, "eval_runtime": 0.7809, "eval_samples_per_second": 65.312, "eval_steps_per_second": 2.561, "step": 48 }, { "epoch": 6.25, "learning_rate": 4.291208791208791e-05, "loss": 0.7793, "step": 50 }, { "epoch": 7.0, "eval_accuracy": 0.7647058823529411, "eval_loss": 0.8426423072814941, "eval_runtime": 0.7688, "eval_samples_per_second": 66.339, "eval_steps_per_second": 2.602, "step": 56 }, { "epoch": 7.5, "learning_rate": 3.989010989010989e-05, "loss": 0.6291, "step": 60 }, { "epoch": 8.0, "eval_accuracy": 0.6862745098039216, "eval_loss": 0.7899176478385925, "eval_runtime": 0.7937, "eval_samples_per_second": 64.258, "eval_steps_per_second": 2.52, "step": 64 }, { "epoch": 8.75, "learning_rate": 3.6868131868131865e-05, "loss": 0.5401, "step": 70 }, { "epoch": 9.0, "eval_accuracy": 0.7254901960784313, "eval_loss": 0.716878354549408, "eval_runtime": 0.7851, "eval_samples_per_second": 64.962, "eval_steps_per_second": 2.548, "step": 72 }, { "epoch": 10.0, "learning_rate": 3.384615384615385e-05, "loss": 0.4358, "step": 80 }, { "epoch": 10.0, "eval_accuracy": 0.7254901960784313, "eval_loss": 0.750454843044281, "eval_runtime": 0.7913, "eval_samples_per_second": 64.453, "eval_steps_per_second": 2.528, "step": 80 }, { "epoch": 11.0, "eval_accuracy": 0.7058823529411765, "eval_loss": 0.8076674342155457, "eval_runtime": 0.7751, "eval_samples_per_second": 65.797, "eval_steps_per_second": 2.58, "step": 88 }, { "epoch": 11.25, "learning_rate": 3.0824175824175825e-05, "loss": 0.3901, "step": 90 }, { "epoch": 12.0, "eval_accuracy": 0.7647058823529411, "eval_loss": 0.6802822351455688, "eval_runtime": 0.8054, "eval_samples_per_second": 63.325, "eval_steps_per_second": 2.483, "step": 96 }, { "epoch": 12.5, "learning_rate": 2.78021978021978e-05, "loss": 0.3033, "step": 100 }, { "epoch": 13.0, "eval_accuracy": 0.7647058823529411, "eval_loss": 0.6483149528503418, "eval_runtime": 0.7691, "eval_samples_per_second": 66.31, "eval_steps_per_second": 2.6, "step": 104 }, { "epoch": 13.75, "learning_rate": 2.478021978021978e-05, "loss": 0.267, "step": 110 }, { "epoch": 14.0, "eval_accuracy": 0.7450980392156863, "eval_loss": 0.6450825333595276, "eval_runtime": 0.8121, "eval_samples_per_second": 62.802, "eval_steps_per_second": 2.463, "step": 112 }, { "epoch": 15.0, "learning_rate": 2.175824175824176e-05, "loss": 0.2212, "step": 120 }, { "epoch": 15.0, "eval_accuracy": 0.7647058823529411, "eval_loss": 0.6118857264518738, "eval_runtime": 0.7703, "eval_samples_per_second": 66.211, "eval_steps_per_second": 2.597, "step": 120 }, { "epoch": 16.0, "eval_accuracy": 0.803921568627451, "eval_loss": 0.614970326423645, "eval_runtime": 0.7768, "eval_samples_per_second": 65.657, "eval_steps_per_second": 2.575, "step": 128 }, { "epoch": 16.25, "learning_rate": 1.873626373626374e-05, "loss": 0.2206, "step": 130 }, { "epoch": 17.0, "eval_accuracy": 0.7843137254901961, "eval_loss": 0.6270039081573486, "eval_runtime": 0.8131, "eval_samples_per_second": 62.722, "eval_steps_per_second": 2.46, "step": 136 }, { "epoch": 17.5, "learning_rate": 1.5714285714285715e-05, "loss": 0.2285, "step": 140 }, { "epoch": 18.0, "eval_accuracy": 0.7647058823529411, "eval_loss": 0.6181018352508545, "eval_runtime": 0.7654, "eval_samples_per_second": 66.634, "eval_steps_per_second": 2.613, "step": 144 }, { "epoch": 18.75, "learning_rate": 1.2692307692307693e-05, "loss": 0.1741, "step": 150 }, { "epoch": 19.0, "eval_accuracy": 0.8431372549019608, "eval_loss": 0.5081135630607605, "eval_runtime": 0.7922, "eval_samples_per_second": 64.379, "eval_steps_per_second": 2.525, "step": 152 }, { "epoch": 20.0, "learning_rate": 9.670329670329671e-06, "loss": 0.1708, "step": 160 }, { "epoch": 20.0, "eval_accuracy": 0.8235294117647058, "eval_loss": 0.5501907467842102, "eval_runtime": 0.7732, "eval_samples_per_second": 65.96, "eval_steps_per_second": 2.587, "step": 160 }, { "epoch": 21.0, "eval_accuracy": 0.803921568627451, "eval_loss": 0.5689105987548828, "eval_runtime": 0.7988, "eval_samples_per_second": 63.843, "eval_steps_per_second": 2.504, "step": 168 }, { "epoch": 21.25, "learning_rate": 6.648351648351649e-06, "loss": 0.16, "step": 170 }, { "epoch": 22.0, "eval_accuracy": 0.8235294117647058, "eval_loss": 0.5137497186660767, "eval_runtime": 0.7803, "eval_samples_per_second": 65.361, "eval_steps_per_second": 2.563, "step": 176 }, { "epoch": 22.5, "learning_rate": 3.6263736263736266e-06, "loss": 0.1567, "step": 180 }, { "epoch": 23.0, "eval_accuracy": 0.8431372549019608, "eval_loss": 0.5207127332687378, "eval_runtime": 0.7678, "eval_samples_per_second": 66.422, "eval_steps_per_second": 2.605, "step": 184 }, { "epoch": 23.75, "learning_rate": 6.043956043956044e-07, "loss": 0.1616, "step": 190 }, { "epoch": 24.0, "eval_accuracy": 0.8235294117647058, "eval_loss": 0.5374550223350525, "eval_runtime": 0.821, "eval_samples_per_second": 62.116, "eval_steps_per_second": 2.436, "step": 192 }, { "epoch": 24.0, "step": 192, "total_flos": 1.8877387048147354e+18, "train_loss": 0.4960318058729172, "train_runtime": 413.057, "train_samples_per_second": 58.975, "train_steps_per_second": 0.465 } ], "logging_steps": 10, "max_steps": 192, "num_input_tokens_seen": 0, "num_train_epochs": 24, "save_steps": 500, "total_flos": 1.8877387048147354e+18, "train_batch_size": 32, "trial_name": null, "trial_params": null }