{ "best_metric": 0.8453333333333334, "best_model_checkpoint": "./vit_finetuned_models_dataset/CIFAR100/50_from_100/facebook_dino-vitb16/model_idx_0702/checkpoints/checkpoint-2664", "epoch": 8.0, "eval_steps": 500, "global_step": 2664, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": Infinity, "learning_rate": 0.0001, "loss": 0.946, "step": 333 }, { "epoch": 1.0, "eval_accuracy": 0.8112, "eval_loss": 0.6392398476600647, "eval_runtime": 13.3762, "eval_samples_per_second": 280.349, "eval_steps_per_second": 4.411, "step": 333 }, { "epoch": 2.0, "grad_norm": 1.4604071378707886, "learning_rate": 0.0001, "loss": 0.4005, "step": 666 }, { "epoch": 2.0, "eval_accuracy": 0.8317333333333333, "eval_loss": 0.5749013423919678, "eval_runtime": 13.2989, "eval_samples_per_second": 281.978, "eval_steps_per_second": 4.436, "step": 666 }, { "epoch": 3.0, "grad_norm": 63.05999755859375, "learning_rate": 0.0001, "loss": 0.2805, "step": 999 }, { "epoch": 3.0, "eval_accuracy": 0.8424, "eval_loss": 0.5639004111289978, "eval_runtime": 13.2901, "eval_samples_per_second": 282.164, "eval_steps_per_second": 4.439, "step": 999 }, { "epoch": 4.0, "grad_norm": 1.2397186756134033, "learning_rate": 0.0001, "loss": 0.2086, "step": 1332 }, { "epoch": 4.0, "eval_accuracy": 0.8304, "eval_loss": 0.6406498551368713, "eval_runtime": 13.3441, "eval_samples_per_second": 281.023, "eval_steps_per_second": 4.421, "step": 1332 }, { "epoch": 5.0, "grad_norm": 7.314879894256592, "learning_rate": 0.0001, "loss": 0.1665, "step": 1665 }, { "epoch": 5.0, "eval_accuracy": 0.828, "eval_loss": 0.6785334348678589, "eval_runtime": 13.5021, "eval_samples_per_second": 277.736, "eval_steps_per_second": 4.37, "step": 1665 }, { "epoch": 6.0, "grad_norm": 0.034189701080322266, "learning_rate": 0.0001, "loss": 0.1587, "step": 1998 }, { "epoch": 6.0, "eval_accuracy": 0.8392, "eval_loss": 0.631488561630249, "eval_runtime": 13.4094, "eval_samples_per_second": 279.654, "eval_steps_per_second": 4.4, "step": 1998 }, { "epoch": 7.0, "grad_norm": 33.375999450683594, "learning_rate": 0.0001, "loss": 0.132, "step": 2331 }, { "epoch": 7.0, "eval_accuracy": 0.8232, "eval_loss": 0.7299953103065491, "eval_runtime": 13.4099, "eval_samples_per_second": 279.643, "eval_steps_per_second": 4.4, "step": 2331 }, { "epoch": 8.0, "grad_norm": 8.396727561950684, "learning_rate": 0.0001, "loss": 0.1319, "step": 2664 }, { "epoch": 8.0, "eval_accuracy": 0.8453333333333334, "eval_loss": 0.6151342391967773, "eval_runtime": 13.9753, "eval_samples_per_second": 268.331, "eval_steps_per_second": 4.222, "step": 2664 } ], "logging_steps": 500, "max_steps": 2997, "num_input_tokens_seen": 0, "num_train_epochs": 9, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 1.317930564980736e+19, "train_batch_size": 64, "trial_name": null, "trial_params": null }