{ "best_metric": 0.8986666666666666, "best_model_checkpoint": "./vit_finetuned_models_dataset/CIFAR100/50_from_100/facebook_dino-vitb16/model_idx_0212/checkpoints/checkpoint-1998", "epoch": 6.0, "eval_steps": 500, "global_step": 1998, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 13.115069389343262, "learning_rate": 8.343343343343344e-05, "loss": 1.039, "step": 333 }, { "epoch": 1.0, "eval_accuracy": 0.8032, "eval_loss": 0.627038300037384, "eval_runtime": 6.8444, "eval_samples_per_second": 547.892, "eval_steps_per_second": 8.62, "step": 333 }, { "epoch": 2.0, "grad_norm": 6.182191371917725, "learning_rate": 6.676676676676677e-05, "loss": 0.3372, "step": 666 }, { "epoch": 2.0, "eval_accuracy": 0.836, "eval_loss": 0.5417731404304504, "eval_runtime": 6.8702, "eval_samples_per_second": 545.834, "eval_steps_per_second": 8.588, "step": 666 }, { "epoch": 3.0, "grad_norm": 6.243861198425293, "learning_rate": 5.01001001001001e-05, "loss": 0.1551, "step": 999 }, { "epoch": 3.0, "eval_accuracy": 0.8610666666666666, "eval_loss": 0.5183677077293396, "eval_runtime": 6.5151, "eval_samples_per_second": 575.585, "eval_steps_per_second": 9.056, "step": 999 }, { "epoch": 4.0, "grad_norm": 0.2019670605659485, "learning_rate": 3.3433433433433435e-05, "loss": 0.0714, "step": 1332 }, { "epoch": 4.0, "eval_accuracy": 0.8704, "eval_loss": 0.4896680414676666, "eval_runtime": 6.8187, "eval_samples_per_second": 549.96, "eval_steps_per_second": 8.653, "step": 1332 }, { "epoch": 5.0, "grad_norm": 0.13753890991210938, "learning_rate": 1.6766766766766767e-05, "loss": 0.0232, "step": 1665 }, { "epoch": 5.0, "eval_accuracy": 0.888, "eval_loss": 0.45525020360946655, "eval_runtime": 6.2762, "eval_samples_per_second": 597.499, "eval_steps_per_second": 9.401, "step": 1665 }, { "epoch": 6.0, "grad_norm": 0.3573720455169678, "learning_rate": 1.001001001001001e-07, "loss": 0.0043, "step": 1998 }, { "epoch": 6.0, "eval_accuracy": 0.8986666666666666, "eval_loss": 0.40733274817466736, "eval_runtime": 6.1866, "eval_samples_per_second": 606.146, "eval_steps_per_second": 9.537, "step": 1998 } ], "logging_steps": 500, "max_steps": 1998, "num_input_tokens_seen": 0, "num_train_epochs": 6, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 9.88447923735552e+18, "train_batch_size": 64, "trial_name": null, "trial_params": null }