{ "best_metric": 0.679702877998352, "best_model_checkpoint": "./drive/Shareddrives/CS198-Drones/final_training_output/vit-base-patch16-224_rice-leaf-disease-augmented-v2_tl/checkpoint-1260", "epoch": 20.0, "eval_steps": 500, "global_step": 1260, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 2.9906086921691895, "learning_rate": 0.00015, "loss": 2.0152, "step": 63 }, { "epoch": 1.0, "eval_accuracy": 0.3482142857142857, "eval_loss": 1.7805147171020508, "eval_runtime": 10.8133, "eval_samples_per_second": 31.073, "eval_steps_per_second": 0.277, "step": 63 }, { "epoch": 2.0, "grad_norm": 2.7998437881469727, "learning_rate": 0.0003, "loss": 1.5405, "step": 126 }, { "epoch": 2.0, "eval_accuracy": 0.6071428571428571, "eval_loss": 1.2886258363723755, "eval_runtime": 10.9701, "eval_samples_per_second": 30.629, "eval_steps_per_second": 0.273, "step": 126 }, { "epoch": 3.0, "grad_norm": 2.3062703609466553, "learning_rate": 0.0002977211629518312, "loss": 1.128, "step": 189 }, { "epoch": 3.0, "eval_accuracy": 0.6636904761904762, "eval_loss": 1.0534131526947021, "eval_runtime": 10.8915, "eval_samples_per_second": 30.85, "eval_steps_per_second": 0.275, "step": 189 }, { "epoch": 4.0, "grad_norm": 1.7634103298187256, "learning_rate": 0.0002909538931178862, "loss": 0.9306, "step": 252 }, { "epoch": 4.0, "eval_accuracy": 0.7113095238095238, "eval_loss": 0.9333988428115845, "eval_runtime": 15.3684, "eval_samples_per_second": 21.863, "eval_steps_per_second": 0.195, "step": 252 }, { "epoch": 5.0, "grad_norm": 1.6794238090515137, "learning_rate": 0.0002799038105676658, "loss": 0.8207, "step": 315 }, { "epoch": 5.0, "eval_accuracy": 0.7321428571428571, "eval_loss": 0.8421538472175598, "eval_runtime": 10.2428, "eval_samples_per_second": 32.804, "eval_steps_per_second": 0.293, "step": 315 }, { "epoch": 6.0, "grad_norm": 1.8601257801055908, "learning_rate": 0.00026490666646784665, "loss": 0.7481, "step": 378 }, { "epoch": 6.0, "eval_accuracy": 0.7113095238095238, "eval_loss": 0.810761034488678, "eval_runtime": 10.9444, "eval_samples_per_second": 30.701, "eval_steps_per_second": 0.274, "step": 378 }, { "epoch": 7.0, "grad_norm": 1.816933512687683, "learning_rate": 0.0002464181414529809, "loss": 0.697, "step": 441 }, { "epoch": 7.0, "eval_accuracy": 0.7410714285714286, "eval_loss": 0.7857556343078613, "eval_runtime": 10.3899, "eval_samples_per_second": 32.339, "eval_steps_per_second": 0.289, "step": 441 }, { "epoch": 8.0, "grad_norm": 1.5066885948181152, "learning_rate": 0.000225, "loss": 0.6561, "step": 504 }, { "epoch": 8.0, "eval_accuracy": 0.75, "eval_loss": 0.7553501129150391, "eval_runtime": 10.8989, "eval_samples_per_second": 30.829, "eval_steps_per_second": 0.275, "step": 504 }, { "epoch": 9.0, "grad_norm": 1.7709600925445557, "learning_rate": 0.00020130302149885031, "loss": 0.626, "step": 567 }, { "epoch": 9.0, "eval_accuracy": 0.75, "eval_loss": 0.7322452664375305, "eval_runtime": 10.5137, "eval_samples_per_second": 31.958, "eval_steps_per_second": 0.285, "step": 567 }, { "epoch": 10.0, "grad_norm": 1.6905821561813354, "learning_rate": 0.00017604722665003956, "loss": 0.6015, "step": 630 }, { "epoch": 10.0, "eval_accuracy": 0.7619047619047619, "eval_loss": 0.7166417241096497, "eval_runtime": 10.7548, "eval_samples_per_second": 31.242, "eval_steps_per_second": 0.279, "step": 630 }, { "epoch": 11.0, "grad_norm": 1.7408339977264404, "learning_rate": 0.00015, "loss": 0.5818, "step": 693 }, { "epoch": 11.0, "eval_accuracy": 0.7589285714285714, "eval_loss": 0.7089646458625793, "eval_runtime": 10.7618, "eval_samples_per_second": 31.222, "eval_steps_per_second": 0.279, "step": 693 }, { "epoch": 12.0, "grad_norm": 1.5762419700622559, "learning_rate": 0.00012395277334996044, "loss": 0.5665, "step": 756 }, { "epoch": 12.0, "eval_accuracy": 0.7589285714285714, "eval_loss": 0.6996546983718872, "eval_runtime": 10.7759, "eval_samples_per_second": 31.181, "eval_steps_per_second": 0.278, "step": 756 }, { "epoch": 13.0, "grad_norm": 2.082526922225952, "learning_rate": 9.869697850114969e-05, "loss": 0.5557, "step": 819 }, { "epoch": 13.0, "eval_accuracy": 0.7589285714285714, "eval_loss": 0.6915065050125122, "eval_runtime": 10.9156, "eval_samples_per_second": 30.782, "eval_steps_per_second": 0.275, "step": 819 }, { "epoch": 14.0, "grad_norm": 1.8890206813812256, "learning_rate": 7.500000000000002e-05, "loss": 0.5458, "step": 882 }, { "epoch": 14.0, "eval_accuracy": 0.7648809523809523, "eval_loss": 0.6875688433647156, "eval_runtime": 10.8297, "eval_samples_per_second": 31.026, "eval_steps_per_second": 0.277, "step": 882 }, { "epoch": 15.0, "grad_norm": 1.422352910041809, "learning_rate": 5.358185854701909e-05, "loss": 0.5378, "step": 945 }, { "epoch": 15.0, "eval_accuracy": 0.7619047619047619, "eval_loss": 0.682266891002655, "eval_runtime": 10.7493, "eval_samples_per_second": 31.258, "eval_steps_per_second": 0.279, "step": 945 }, { "epoch": 16.0, "grad_norm": 1.3667608499526978, "learning_rate": 3.509333353215331e-05, "loss": 0.5335, "step": 1008 }, { "epoch": 16.0, "eval_accuracy": 0.7678571428571429, "eval_loss": 0.6814180612564087, "eval_runtime": 10.6615, "eval_samples_per_second": 31.515, "eval_steps_per_second": 0.281, "step": 1008 }, { "epoch": 17.0, "grad_norm": 1.8170311450958252, "learning_rate": 2.009618943233419e-05, "loss": 0.5298, "step": 1071 }, { "epoch": 17.0, "eval_accuracy": 0.7708333333333334, "eval_loss": 0.6809626817703247, "eval_runtime": 11.1963, "eval_samples_per_second": 30.01, "eval_steps_per_second": 0.268, "step": 1071 }, { "epoch": 18.0, "grad_norm": 1.4589533805847168, "learning_rate": 9.046106882113751e-06, "loss": 0.5277, "step": 1134 }, { "epoch": 18.0, "eval_accuracy": 0.7708333333333334, "eval_loss": 0.6797568798065186, "eval_runtime": 11.3311, "eval_samples_per_second": 29.653, "eval_steps_per_second": 0.265, "step": 1134 }, { "epoch": 19.0, "grad_norm": 1.4728538990020752, "learning_rate": 2.2788370481687965e-06, "loss": 0.5264, "step": 1197 }, { "epoch": 19.0, "eval_accuracy": 0.7708333333333334, "eval_loss": 0.6798648238182068, "eval_runtime": 10.4974, "eval_samples_per_second": 32.008, "eval_steps_per_second": 0.286, "step": 1197 }, { "epoch": 20.0, "grad_norm": 1.4680770635604858, "learning_rate": 0.0, "loss": 0.5265, "step": 1260 }, { "epoch": 20.0, "eval_accuracy": 0.7708333333333334, "eval_loss": 0.679702877998352, "eval_runtime": 13.6697, "eval_samples_per_second": 24.58, "eval_steps_per_second": 0.219, "step": 1260 }, { "epoch": 20.0, "step": 1260, "total_flos": 1.239938509307904e+19, "train_loss": 0.759749530610584, "train_runtime": 5753.852, "train_samples_per_second": 27.807, "train_steps_per_second": 0.219 } ], "logging_steps": 500, "max_steps": 1260, "num_input_tokens_seen": 0, "num_train_epochs": 20, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1.239938509307904e+19, "train_batch_size": 128, "trial_name": null, "trial_params": null }