| { | |
| "best_metric": 0.679702877998352, | |
| "best_model_checkpoint": "./drive/Shareddrives/CS198-Drones/final_training_output/vit-base-patch16-224_rice-leaf-disease-augmented-v2_tl/checkpoint-1260", | |
| "epoch": 20.0, | |
| "eval_steps": 500, | |
| "global_step": 1260, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "grad_norm": 2.9906086921691895, | |
| "learning_rate": 0.00015, | |
| "loss": 2.0152, | |
| "step": 63 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_accuracy": 0.3482142857142857, | |
| "eval_loss": 1.7805147171020508, | |
| "eval_runtime": 10.8133, | |
| "eval_samples_per_second": 31.073, | |
| "eval_steps_per_second": 0.277, | |
| "step": 63 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "grad_norm": 2.7998437881469727, | |
| "learning_rate": 0.0003, | |
| "loss": 1.5405, | |
| "step": 126 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_accuracy": 0.6071428571428571, | |
| "eval_loss": 1.2886258363723755, | |
| "eval_runtime": 10.9701, | |
| "eval_samples_per_second": 30.629, | |
| "eval_steps_per_second": 0.273, | |
| "step": 126 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "grad_norm": 2.3062703609466553, | |
| "learning_rate": 0.0002977211629518312, | |
| "loss": 1.128, | |
| "step": 189 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accuracy": 0.6636904761904762, | |
| "eval_loss": 1.0534131526947021, | |
| "eval_runtime": 10.8915, | |
| "eval_samples_per_second": 30.85, | |
| "eval_steps_per_second": 0.275, | |
| "step": 189 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "grad_norm": 1.7634103298187256, | |
| "learning_rate": 0.0002909538931178862, | |
| "loss": 0.9306, | |
| "step": 252 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_accuracy": 0.7113095238095238, | |
| "eval_loss": 0.9333988428115845, | |
| "eval_runtime": 15.3684, | |
| "eval_samples_per_second": 21.863, | |
| "eval_steps_per_second": 0.195, | |
| "step": 252 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "grad_norm": 1.6794238090515137, | |
| "learning_rate": 0.0002799038105676658, | |
| "loss": 0.8207, | |
| "step": 315 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_accuracy": 0.7321428571428571, | |
| "eval_loss": 0.8421538472175598, | |
| "eval_runtime": 10.2428, | |
| "eval_samples_per_second": 32.804, | |
| "eval_steps_per_second": 0.293, | |
| "step": 315 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "grad_norm": 1.8601257801055908, | |
| "learning_rate": 0.00026490666646784665, | |
| "loss": 0.7481, | |
| "step": 378 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_accuracy": 0.7113095238095238, | |
| "eval_loss": 0.810761034488678, | |
| "eval_runtime": 10.9444, | |
| "eval_samples_per_second": 30.701, | |
| "eval_steps_per_second": 0.274, | |
| "step": 378 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "grad_norm": 1.816933512687683, | |
| "learning_rate": 0.0002464181414529809, | |
| "loss": 0.697, | |
| "step": 441 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_accuracy": 0.7410714285714286, | |
| "eval_loss": 0.7857556343078613, | |
| "eval_runtime": 10.3899, | |
| "eval_samples_per_second": 32.339, | |
| "eval_steps_per_second": 0.289, | |
| "step": 441 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "grad_norm": 1.5066885948181152, | |
| "learning_rate": 0.000225, | |
| "loss": 0.6561, | |
| "step": 504 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_accuracy": 0.75, | |
| "eval_loss": 0.7553501129150391, | |
| "eval_runtime": 10.8989, | |
| "eval_samples_per_second": 30.829, | |
| "eval_steps_per_second": 0.275, | |
| "step": 504 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "grad_norm": 1.7709600925445557, | |
| "learning_rate": 0.00020130302149885031, | |
| "loss": 0.626, | |
| "step": 567 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_accuracy": 0.75, | |
| "eval_loss": 0.7322452664375305, | |
| "eval_runtime": 10.5137, | |
| "eval_samples_per_second": 31.958, | |
| "eval_steps_per_second": 0.285, | |
| "step": 567 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "grad_norm": 1.6905821561813354, | |
| "learning_rate": 0.00017604722665003956, | |
| "loss": 0.6015, | |
| "step": 630 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_accuracy": 0.7619047619047619, | |
| "eval_loss": 0.7166417241096497, | |
| "eval_runtime": 10.7548, | |
| "eval_samples_per_second": 31.242, | |
| "eval_steps_per_second": 0.279, | |
| "step": 630 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "grad_norm": 1.7408339977264404, | |
| "learning_rate": 0.00015, | |
| "loss": 0.5818, | |
| "step": 693 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "eval_accuracy": 0.7589285714285714, | |
| "eval_loss": 0.7089646458625793, | |
| "eval_runtime": 10.7618, | |
| "eval_samples_per_second": 31.222, | |
| "eval_steps_per_second": 0.279, | |
| "step": 693 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "grad_norm": 1.5762419700622559, | |
| "learning_rate": 0.00012395277334996044, | |
| "loss": 0.5665, | |
| "step": 756 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "eval_accuracy": 0.7589285714285714, | |
| "eval_loss": 0.6996546983718872, | |
| "eval_runtime": 10.7759, | |
| "eval_samples_per_second": 31.181, | |
| "eval_steps_per_second": 0.278, | |
| "step": 756 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "grad_norm": 2.082526922225952, | |
| "learning_rate": 9.869697850114969e-05, | |
| "loss": 0.5557, | |
| "step": 819 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "eval_accuracy": 0.7589285714285714, | |
| "eval_loss": 0.6915065050125122, | |
| "eval_runtime": 10.9156, | |
| "eval_samples_per_second": 30.782, | |
| "eval_steps_per_second": 0.275, | |
| "step": 819 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "grad_norm": 1.8890206813812256, | |
| "learning_rate": 7.500000000000002e-05, | |
| "loss": 0.5458, | |
| "step": 882 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "eval_accuracy": 0.7648809523809523, | |
| "eval_loss": 0.6875688433647156, | |
| "eval_runtime": 10.8297, | |
| "eval_samples_per_second": 31.026, | |
| "eval_steps_per_second": 0.277, | |
| "step": 882 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "grad_norm": 1.422352910041809, | |
| "learning_rate": 5.358185854701909e-05, | |
| "loss": 0.5378, | |
| "step": 945 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "eval_accuracy": 0.7619047619047619, | |
| "eval_loss": 0.682266891002655, | |
| "eval_runtime": 10.7493, | |
| "eval_samples_per_second": 31.258, | |
| "eval_steps_per_second": 0.279, | |
| "step": 945 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "grad_norm": 1.3667608499526978, | |
| "learning_rate": 3.509333353215331e-05, | |
| "loss": 0.5335, | |
| "step": 1008 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "eval_accuracy": 0.7678571428571429, | |
| "eval_loss": 0.6814180612564087, | |
| "eval_runtime": 10.6615, | |
| "eval_samples_per_second": 31.515, | |
| "eval_steps_per_second": 0.281, | |
| "step": 1008 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "grad_norm": 1.8170311450958252, | |
| "learning_rate": 2.009618943233419e-05, | |
| "loss": 0.5298, | |
| "step": 1071 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "eval_accuracy": 0.7708333333333334, | |
| "eval_loss": 0.6809626817703247, | |
| "eval_runtime": 11.1963, | |
| "eval_samples_per_second": 30.01, | |
| "eval_steps_per_second": 0.268, | |
| "step": 1071 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "grad_norm": 1.4589533805847168, | |
| "learning_rate": 9.046106882113751e-06, | |
| "loss": 0.5277, | |
| "step": 1134 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "eval_accuracy": 0.7708333333333334, | |
| "eval_loss": 0.6797568798065186, | |
| "eval_runtime": 11.3311, | |
| "eval_samples_per_second": 29.653, | |
| "eval_steps_per_second": 0.265, | |
| "step": 1134 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "grad_norm": 1.4728538990020752, | |
| "learning_rate": 2.2788370481687965e-06, | |
| "loss": 0.5264, | |
| "step": 1197 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "eval_accuracy": 0.7708333333333334, | |
| "eval_loss": 0.6798648238182068, | |
| "eval_runtime": 10.4974, | |
| "eval_samples_per_second": 32.008, | |
| "eval_steps_per_second": 0.286, | |
| "step": 1197 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "grad_norm": 1.4680770635604858, | |
| "learning_rate": 0.0, | |
| "loss": 0.5265, | |
| "step": 1260 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "eval_accuracy": 0.7708333333333334, | |
| "eval_loss": 0.679702877998352, | |
| "eval_runtime": 13.6697, | |
| "eval_samples_per_second": 24.58, | |
| "eval_steps_per_second": 0.219, | |
| "step": 1260 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "step": 1260, | |
| "total_flos": 1.239938509307904e+19, | |
| "train_loss": 0.759749530610584, | |
| "train_runtime": 5753.852, | |
| "train_samples_per_second": 27.807, | |
| "train_steps_per_second": 0.219 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 1260, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 20, | |
| "save_steps": 500, | |
| "stateful_callbacks": { | |
| "TrainerControl": { | |
| "args": { | |
| "should_epoch_stop": false, | |
| "should_evaluate": false, | |
| "should_log": false, | |
| "should_save": true, | |
| "should_training_stop": true | |
| }, | |
| "attributes": {} | |
| } | |
| }, | |
| "total_flos": 1.239938509307904e+19, | |
| "train_batch_size": 128, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |