{ "best_metric": 0.9176, "best_model_checkpoint": "./vit_finetuned_models_dataset/CIFAR100/50_from_100/google_vit-base-patch16-224/model_idx_0999/checkpoints/checkpoint-1332", "epoch": 4.0, "eval_steps": 500, "global_step": 1332, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": Infinity, "learning_rate": 0.0004271931404387096, "loss": 0.879, "step": 333 }, { "epoch": 1.0, "eval_accuracy": 0.824, "eval_loss": 0.6017924547195435, "eval_runtime": 7.2244, "eval_samples_per_second": 519.074, "eval_steps_per_second": 8.167, "step": 333 }, { "epoch": 2.0, "grad_norm": 27.124963760375977, "learning_rate": 0.00025058963771413845, "loss": 0.3896, "step": 666 }, { "epoch": 2.0, "eval_accuracy": 0.8669333333333333, "eval_loss": 0.47467219829559326, "eval_runtime": 7.2464, "eval_samples_per_second": 517.495, "eval_steps_per_second": 8.142, "step": 666 }, { "epoch": 3.0, "grad_norm": 1.388419270515442, "learning_rate": 7.36407332135117e-05, "loss": 0.131, "step": 999 }, { "epoch": 3.0, "eval_accuracy": 0.9021333333333333, "eval_loss": 0.3338121771812439, "eval_runtime": 7.1777, "eval_samples_per_second": 522.454, "eval_steps_per_second": 8.22, "step": 999 }, { "epoch": 4.0, "grad_norm": 0.13044586777687073, "learning_rate": 6.953462348691098e-10, "loss": 0.0284, "step": 1332 }, { "epoch": 4.0, "eval_accuracy": 0.9176, "eval_loss": 0.30562832951545715, "eval_runtime": 8.0981, "eval_samples_per_second": 463.074, "eval_steps_per_second": 7.286, "step": 1332 } ], "logging_steps": 500, "max_steps": 1332, "num_input_tokens_seen": 0, "num_train_epochs": 4, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 6.58965282490368e+18, "train_batch_size": 64, "trial_name": null, "trial_params": null }