| { | |
| "best_metric": 0.7191632129465166, | |
| "best_model_checkpoint": "Distilled-Melanoma-Classification-ResNet/checkpoint-63325", | |
| "epoch": 29.0, | |
| "eval_steps": 500, | |
| "global_step": 73457, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "learning_rate": 4.8333333333333334e-05, | |
| "loss": 1.8178, | |
| "step": 2533 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_accuracy": 0.5569370436155516, | |
| "eval_loss": 1.4635199308395386, | |
| "eval_runtime": 443.0799, | |
| "eval_samples_per_second": 11.436, | |
| "eval_steps_per_second": 1.431, | |
| "step": 2533 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "learning_rate": 4.666666666666667e-05, | |
| "loss": 1.5613, | |
| "step": 5066 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_accuracy": 0.6009473060982831, | |
| "eval_loss": 1.3275712728500366, | |
| "eval_runtime": 450.6621, | |
| "eval_samples_per_second": 11.243, | |
| "eval_steps_per_second": 1.407, | |
| "step": 5066 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "learning_rate": 4.5e-05, | |
| "loss": 1.4093, | |
| "step": 7599 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accuracy": 0.6279850009867772, | |
| "eval_loss": 1.2198262214660645, | |
| "eval_runtime": 455.8599, | |
| "eval_samples_per_second": 11.115, | |
| "eval_steps_per_second": 1.391, | |
| "step": 7599 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "learning_rate": 4.3333333333333334e-05, | |
| "loss": 1.2938, | |
| "step": 10132 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_accuracy": 0.6360765739096113, | |
| "eval_loss": 1.2061253786087036, | |
| "eval_runtime": 457.5927, | |
| "eval_samples_per_second": 11.073, | |
| "eval_steps_per_second": 1.386, | |
| "step": 10132 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "learning_rate": 4.166666666666667e-05, | |
| "loss": 1.2145, | |
| "step": 12665 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_accuracy": 0.640615748963884, | |
| "eval_loss": 1.102392554283142, | |
| "eval_runtime": 461.4922, | |
| "eval_samples_per_second": 10.98, | |
| "eval_steps_per_second": 1.374, | |
| "step": 12665 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "learning_rate": 4e-05, | |
| "loss": 1.143, | |
| "step": 15198 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_accuracy": 0.6682455101638051, | |
| "eval_loss": 1.0069061517715454, | |
| "eval_runtime": 464.3259, | |
| "eval_samples_per_second": 10.913, | |
| "eval_steps_per_second": 1.365, | |
| "step": 15198 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "learning_rate": 3.8333333333333334e-05, | |
| "loss": 1.065, | |
| "step": 17731 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_accuracy": 0.6714031971580817, | |
| "eval_loss": 1.0104970932006836, | |
| "eval_runtime": 464.529, | |
| "eval_samples_per_second": 10.908, | |
| "eval_steps_per_second": 1.365, | |
| "step": 17731 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "learning_rate": 3.6666666666666666e-05, | |
| "loss": 0.9922, | |
| "step": 20264 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_accuracy": 0.6741661732780738, | |
| "eval_loss": 1.0025968551635742, | |
| "eval_runtime": 465.5511, | |
| "eval_samples_per_second": 10.884, | |
| "eval_steps_per_second": 1.362, | |
| "step": 20264 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "learning_rate": 3.5e-05, | |
| "loss": 0.8981, | |
| "step": 22797 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_accuracy": 0.6893625419380304, | |
| "eval_loss": 0.9656845331192017, | |
| "eval_runtime": 467.5026, | |
| "eval_samples_per_second": 10.838, | |
| "eval_steps_per_second": 1.356, | |
| "step": 22797 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "learning_rate": 3.3333333333333335e-05, | |
| "loss": 0.8036, | |
| "step": 25330 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_accuracy": 0.6883757647523189, | |
| "eval_loss": 0.9617614150047302, | |
| "eval_runtime": 460.7588, | |
| "eval_samples_per_second": 10.997, | |
| "eval_steps_per_second": 1.376, | |
| "step": 25330 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "learning_rate": 3.1666666666666666e-05, | |
| "loss": 0.6933, | |
| "step": 27863 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "eval_accuracy": 0.6964673376751529, | |
| "eval_loss": 0.9330915212631226, | |
| "eval_runtime": 457.9554, | |
| "eval_samples_per_second": 11.064, | |
| "eval_steps_per_second": 1.384, | |
| "step": 27863 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "learning_rate": 3e-05, | |
| "loss": 0.5867, | |
| "step": 30396 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "eval_accuracy": 0.6954805604894415, | |
| "eval_loss": 0.9513295292854309, | |
| "eval_runtime": 460.1198, | |
| "eval_samples_per_second": 11.012, | |
| "eval_steps_per_second": 1.378, | |
| "step": 30396 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "learning_rate": 2.8333333333333335e-05, | |
| "loss": 0.4942, | |
| "step": 32929 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "eval_accuracy": 0.7051509769094139, | |
| "eval_loss": 0.9170295596122742, | |
| "eval_runtime": 461.0234, | |
| "eval_samples_per_second": 10.991, | |
| "eval_steps_per_second": 1.375, | |
| "step": 32929 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "learning_rate": 2.6666666666666667e-05, | |
| "loss": 0.4175, | |
| "step": 35462 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "eval_accuracy": 0.7053483323465561, | |
| "eval_loss": 0.9810006618499756, | |
| "eval_runtime": 462.5023, | |
| "eval_samples_per_second": 10.956, | |
| "eval_steps_per_second": 1.371, | |
| "step": 35462 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "learning_rate": 2.5e-05, | |
| "loss": 0.3539, | |
| "step": 37995 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "eval_accuracy": 0.7049536214722716, | |
| "eval_loss": 0.9560312032699585, | |
| "eval_runtime": 460.5217, | |
| "eval_samples_per_second": 11.003, | |
| "eval_steps_per_second": 1.377, | |
| "step": 37995 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "learning_rate": 2.3333333333333336e-05, | |
| "loss": 0.3072, | |
| "step": 40528 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "eval_accuracy": 0.7067298204065522, | |
| "eval_loss": 0.9344322085380554, | |
| "eval_runtime": 460.2866, | |
| "eval_samples_per_second": 11.008, | |
| "eval_steps_per_second": 1.377, | |
| "step": 40528 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "learning_rate": 2.1666666666666667e-05, | |
| "loss": 0.2729, | |
| "step": 43061 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "eval_accuracy": 0.7128478389579633, | |
| "eval_loss": 0.8949710726737976, | |
| "eval_runtime": 464.9931, | |
| "eval_samples_per_second": 10.897, | |
| "eval_steps_per_second": 1.363, | |
| "step": 43061 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "learning_rate": 2e-05, | |
| "loss": 0.2416, | |
| "step": 45594 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "eval_accuracy": 0.7049536214722716, | |
| "eval_loss": 0.8919546604156494, | |
| "eval_runtime": 462.6468, | |
| "eval_samples_per_second": 10.952, | |
| "eval_steps_per_second": 1.37, | |
| "step": 45594 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "learning_rate": 1.8333333333333333e-05, | |
| "loss": 0.2173, | |
| "step": 48127 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "eval_accuracy": 0.7108742845865403, | |
| "eval_loss": 0.879001259803772, | |
| "eval_runtime": 461.3852, | |
| "eval_samples_per_second": 10.982, | |
| "eval_steps_per_second": 1.374, | |
| "step": 48127 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "learning_rate": 1.6666666666666667e-05, | |
| "loss": 0.1973, | |
| "step": 50660 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "eval_accuracy": 0.7162028813893823, | |
| "eval_loss": 0.8711328506469727, | |
| "eval_runtime": 460.7389, | |
| "eval_samples_per_second": 10.998, | |
| "eval_steps_per_second": 1.376, | |
| "step": 50660 | |
| }, | |
| { | |
| "epoch": 21.0, | |
| "learning_rate": 1.5e-05, | |
| "loss": 0.1806, | |
| "step": 53193 | |
| }, | |
| { | |
| "epoch": 21.0, | |
| "eval_accuracy": 0.7061377540951254, | |
| "eval_loss": 0.8637410998344421, | |
| "eval_runtime": 462.8193, | |
| "eval_samples_per_second": 10.948, | |
| "eval_steps_per_second": 1.37, | |
| "step": 53193 | |
| }, | |
| { | |
| "epoch": 22.0, | |
| "learning_rate": 1.3333333333333333e-05, | |
| "loss": 0.1662, | |
| "step": 55726 | |
| }, | |
| { | |
| "epoch": 22.0, | |
| "eval_accuracy": 0.717387014012236, | |
| "eval_loss": 0.8513094186782837, | |
| "eval_runtime": 457.9446, | |
| "eval_samples_per_second": 11.065, | |
| "eval_steps_per_second": 1.384, | |
| "step": 55726 | |
| }, | |
| { | |
| "epoch": 23.0, | |
| "learning_rate": 1.1666666666666668e-05, | |
| "loss": 0.1549, | |
| "step": 58259 | |
| }, | |
| { | |
| "epoch": 23.0, | |
| "eval_accuracy": 0.7156108150779554, | |
| "eval_loss": 0.8369139432907104, | |
| "eval_runtime": 459.9692, | |
| "eval_samples_per_second": 11.016, | |
| "eval_steps_per_second": 1.378, | |
| "step": 58259 | |
| }, | |
| { | |
| "epoch": 24.0, | |
| "learning_rate": 1e-05, | |
| "loss": 0.1443, | |
| "step": 60792 | |
| }, | |
| { | |
| "epoch": 24.0, | |
| "eval_accuracy": 0.7138346161436747, | |
| "eval_loss": 0.8337984681129456, | |
| "eval_runtime": 455.8047, | |
| "eval_samples_per_second": 11.117, | |
| "eval_steps_per_second": 1.391, | |
| "step": 60792 | |
| }, | |
| { | |
| "epoch": 25.0, | |
| "learning_rate": 8.333333333333334e-06, | |
| "loss": 0.1347, | |
| "step": 63325 | |
| }, | |
| { | |
| "epoch": 25.0, | |
| "eval_accuracy": 0.7191632129465166, | |
| "eval_loss": 0.8258342146873474, | |
| "eval_runtime": 460.9514, | |
| "eval_samples_per_second": 10.992, | |
| "eval_steps_per_second": 1.375, | |
| "step": 63325 | |
| }, | |
| { | |
| "epoch": 26.0, | |
| "learning_rate": 6.666666666666667e-06, | |
| "loss": 0.1271, | |
| "step": 65858 | |
| }, | |
| { | |
| "epoch": 26.0, | |
| "eval_accuracy": 0.717387014012236, | |
| "eval_loss": 0.8176981210708618, | |
| "eval_runtime": 460.4508, | |
| "eval_samples_per_second": 11.004, | |
| "eval_steps_per_second": 1.377, | |
| "step": 65858 | |
| }, | |
| { | |
| "epoch": 27.0, | |
| "learning_rate": 5e-06, | |
| "loss": 0.1198, | |
| "step": 68391 | |
| }, | |
| { | |
| "epoch": 27.0, | |
| "eval_accuracy": 0.7165975922636668, | |
| "eval_loss": 0.8105741739273071, | |
| "eval_runtime": 459.2895, | |
| "eval_samples_per_second": 11.032, | |
| "eval_steps_per_second": 1.38, | |
| "step": 68391 | |
| }, | |
| { | |
| "epoch": 28.0, | |
| "learning_rate": 3.3333333333333333e-06, | |
| "loss": 0.115, | |
| "step": 70924 | |
| }, | |
| { | |
| "epoch": 28.0, | |
| "eval_accuracy": 0.7171896585750938, | |
| "eval_loss": 0.8162857890129089, | |
| "eval_runtime": 446.9777, | |
| "eval_samples_per_second": 11.336, | |
| "eval_steps_per_second": 1.418, | |
| "step": 70924 | |
| }, | |
| { | |
| "epoch": 29.0, | |
| "learning_rate": 1.6666666666666667e-06, | |
| "loss": 0.1101, | |
| "step": 73457 | |
| }, | |
| { | |
| "epoch": 29.0, | |
| "eval_accuracy": 0.717387014012236, | |
| "eval_loss": 0.8069340586662292, | |
| "eval_runtime": 477.0626, | |
| "eval_samples_per_second": 10.621, | |
| "eval_steps_per_second": 1.329, | |
| "step": 73457 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 75990, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 30, | |
| "save_steps": 500, | |
| "total_flos": 1.2485637303036936e+19, | |
| "train_batch_size": 8, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |