{ "best_metric": 0.35881221294403076, "best_model_checkpoint": "deepfake_vs_real_image_detection/checkpoint-1120", "epoch": 70.0, "eval_steps": 500, "global_step": 1120, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.6946107784431138, "eval_loss": 1.4309433698654175, "eval_runtime": 4.3566, "eval_samples_per_second": 76.666, "eval_steps_per_second": 9.641, "step": 16 }, { "epoch": 2.0, "eval_accuracy": 0.7035928143712575, "eval_loss": 1.3571979999542236, "eval_runtime": 4.4448, "eval_samples_per_second": 75.144, "eval_steps_per_second": 9.449, "step": 32 }, { "epoch": 3.0, "eval_accuracy": 0.7095808383233533, "eval_loss": 1.2381948232650757, "eval_runtime": 4.5106, "eval_samples_per_second": 74.048, "eval_steps_per_second": 9.311, "step": 48 }, { "epoch": 4.0, "eval_accuracy": 0.7485029940119761, "eval_loss": 1.1571621894836426, "eval_runtime": 4.3237, "eval_samples_per_second": 77.249, "eval_steps_per_second": 9.714, "step": 64 }, { "epoch": 5.0, "eval_accuracy": 0.7544910179640718, "eval_loss": 1.1075578927993774, "eval_runtime": 4.3443, "eval_samples_per_second": 76.883, "eval_steps_per_second": 9.668, "step": 80 }, { "epoch": 6.0, "eval_accuracy": 0.7544910179640718, "eval_loss": 1.0685527324676514, "eval_runtime": 4.4445, "eval_samples_per_second": 75.149, "eval_steps_per_second": 9.45, "step": 96 }, { "epoch": 7.0, "eval_accuracy": 0.7574850299401198, "eval_loss": 1.0224419832229614, "eval_runtime": 4.3333, "eval_samples_per_second": 77.078, "eval_steps_per_second": 9.692, "step": 112 }, { "epoch": 8.0, "eval_accuracy": 0.7604790419161677, "eval_loss": 0.9735947847366333, "eval_runtime": 4.4514, "eval_samples_per_second": 75.033, "eval_steps_per_second": 9.435, "step": 128 }, { "epoch": 9.0, "eval_accuracy": 0.7634730538922155, "eval_loss": 0.935190737247467, "eval_runtime": 4.483, "eval_samples_per_second": 74.504, "eval_steps_per_second": 9.369, "step": 144 }, { "epoch": 10.0, "eval_accuracy": 0.7574850299401198, "eval_loss": 0.8989432454109192, "eval_runtime": 4.3947, "eval_samples_per_second": 76.0, "eval_steps_per_second": 9.557, "step": 160 }, { "epoch": 11.0, "eval_accuracy": 0.7514970059880239, "eval_loss": 0.8565046787261963, "eval_runtime": 4.4679, "eval_samples_per_second": 74.755, "eval_steps_per_second": 9.4, "step": 176 }, { "epoch": 12.0, "eval_accuracy": 0.7634730538922155, "eval_loss": 0.8191085457801819, "eval_runtime": 4.4986, "eval_samples_per_second": 74.245, "eval_steps_per_second": 9.336, "step": 192 }, { "epoch": 13.0, "eval_accuracy": 0.7634730538922155, "eval_loss": 0.783191442489624, "eval_runtime": 4.5843, "eval_samples_per_second": 72.857, "eval_steps_per_second": 9.162, "step": 208 }, { "epoch": 14.0, "eval_accuracy": 0.7724550898203593, "eval_loss": 0.7542709708213806, "eval_runtime": 4.417, "eval_samples_per_second": 75.617, "eval_steps_per_second": 9.509, "step": 224 }, { "epoch": 15.0, "eval_accuracy": 0.7694610778443114, "eval_loss": 0.7199692130088806, "eval_runtime": 4.401, "eval_samples_per_second": 75.891, "eval_steps_per_second": 9.543, "step": 240 }, { "epoch": 16.0, "eval_accuracy": 0.7754491017964071, "eval_loss": 0.6858012676239014, "eval_runtime": 4.4254, "eval_samples_per_second": 75.474, "eval_steps_per_second": 9.491, "step": 256 }, { "epoch": 17.0, "eval_accuracy": 0.7784431137724551, "eval_loss": 0.6566184759140015, "eval_runtime": 4.4216, "eval_samples_per_second": 75.539, "eval_steps_per_second": 9.499, "step": 272 }, { "epoch": 18.0, "eval_accuracy": 0.7844311377245509, "eval_loss": 0.628990650177002, "eval_runtime": 4.4307, "eval_samples_per_second": 75.383, "eval_steps_per_second": 9.479, "step": 288 }, { "epoch": 19.0, "eval_accuracy": 0.7844311377245509, "eval_loss": 0.6014779210090637, "eval_runtime": 4.3612, "eval_samples_per_second": 76.584, "eval_steps_per_second": 9.63, "step": 304 }, { "epoch": 20.0, "eval_accuracy": 0.7904191616766467, "eval_loss": 0.5828869938850403, "eval_runtime": 4.3656, "eval_samples_per_second": 76.508, "eval_steps_per_second": 9.621, "step": 320 }, { "epoch": 21.0, "eval_accuracy": 0.7904191616766467, "eval_loss": 0.560990571975708, "eval_runtime": 4.4037, "eval_samples_per_second": 75.846, "eval_steps_per_second": 9.538, "step": 336 }, { "epoch": 22.0, "eval_accuracy": 0.7904191616766467, "eval_loss": 0.5444124937057495, "eval_runtime": 4.4206, "eval_samples_per_second": 75.556, "eval_steps_per_second": 9.501, "step": 352 }, { "epoch": 23.0, "eval_accuracy": 0.7964071856287425, "eval_loss": 0.5321463346481323, "eval_runtime": 4.402, "eval_samples_per_second": 75.875, "eval_steps_per_second": 9.541, "step": 368 }, { "epoch": 24.0, "eval_accuracy": 0.8023952095808383, "eval_loss": 0.521594226360321, "eval_runtime": 4.4337, "eval_samples_per_second": 75.331, "eval_steps_per_second": 9.473, "step": 384 }, { "epoch": 25.0, "eval_accuracy": 0.8053892215568862, "eval_loss": 0.5053771138191223, "eval_runtime": 4.4563, "eval_samples_per_second": 74.95, "eval_steps_per_second": 9.425, "step": 400 }, { "epoch": 26.0, "eval_accuracy": 0.8143712574850299, "eval_loss": 0.4930258095264435, "eval_runtime": 4.3955, "eval_samples_per_second": 75.986, "eval_steps_per_second": 9.555, "step": 416 }, { "epoch": 27.0, "eval_accuracy": 0.811377245508982, "eval_loss": 0.4849102795124054, "eval_runtime": 4.4566, "eval_samples_per_second": 74.945, "eval_steps_per_second": 9.424, "step": 432 }, { "epoch": 28.0, "eval_accuracy": 0.811377245508982, "eval_loss": 0.47692808508872986, "eval_runtime": 4.4557, "eval_samples_per_second": 74.959, "eval_steps_per_second": 9.426, "step": 448 }, { "epoch": 29.0, "eval_accuracy": 0.8293413173652695, "eval_loss": 0.46685636043548584, "eval_runtime": 4.3405, "eval_samples_per_second": 76.949, "eval_steps_per_second": 9.676, "step": 464 }, { "epoch": 30.0, "eval_accuracy": 0.8323353293413174, "eval_loss": 0.45782506465911865, "eval_runtime": 4.3468, "eval_samples_per_second": 76.838, "eval_steps_per_second": 9.662, "step": 480 }, { "epoch": 31.0, "eval_accuracy": 0.8323353293413174, "eval_loss": 0.44891008734703064, "eval_runtime": 4.5111, "eval_samples_per_second": 74.039, "eval_steps_per_second": 9.31, "step": 496 }, { "epoch": 31.25, "grad_norm": 3.9690632820129395, "learning_rate": 8.098055790363483e-07, "loss": 0.6987, "step": 500 }, { "epoch": 32.0, "eval_accuracy": 0.8323353293413174, "eval_loss": 0.4414936900138855, "eval_runtime": 4.3863, "eval_samples_per_second": 76.146, "eval_steps_per_second": 9.575, "step": 512 }, { "epoch": 33.0, "eval_accuracy": 0.8323353293413174, "eval_loss": 0.435556560754776, "eval_runtime": 4.3922, "eval_samples_per_second": 76.043, "eval_steps_per_second": 9.562, "step": 528 }, { "epoch": 34.0, "eval_accuracy": 0.8323353293413174, "eval_loss": 0.4296257793903351, "eval_runtime": 4.3498, "eval_samples_per_second": 76.785, "eval_steps_per_second": 9.656, "step": 544 }, { "epoch": 35.0, "eval_accuracy": 0.8323353293413174, "eval_loss": 0.4240988492965698, "eval_runtime": 4.3863, "eval_samples_per_second": 76.146, "eval_steps_per_second": 9.575, "step": 560 }, { "epoch": 36.0, "eval_accuracy": 0.8353293413173652, "eval_loss": 0.41868290305137634, "eval_runtime": 4.4309, "eval_samples_per_second": 75.38, "eval_steps_per_second": 9.479, "step": 576 }, { "epoch": 37.0, "eval_accuracy": 0.8383233532934131, "eval_loss": 0.413825124502182, "eval_runtime": 4.3459, "eval_samples_per_second": 76.853, "eval_steps_per_second": 9.664, "step": 592 }, { "epoch": 38.0, "eval_accuracy": 0.8413173652694611, "eval_loss": 0.4092709720134735, "eval_runtime": 4.353, "eval_samples_per_second": 76.728, "eval_steps_per_second": 9.648, "step": 608 }, { "epoch": 39.0, "eval_accuracy": 0.8413173652694611, "eval_loss": 0.40586671233177185, "eval_runtime": 4.3701, "eval_samples_per_second": 76.429, "eval_steps_per_second": 9.611, "step": 624 }, { "epoch": 40.0, "eval_accuracy": 0.8502994011976048, "eval_loss": 0.401659220457077, "eval_runtime": 4.4026, "eval_samples_per_second": 75.864, "eval_steps_per_second": 9.54, "step": 640 }, { "epoch": 41.0, "eval_accuracy": 0.8502994011976048, "eval_loss": 0.3979702293872833, "eval_runtime": 4.5672, "eval_samples_per_second": 73.13, "eval_steps_per_second": 9.196, "step": 656 }, { "epoch": 42.0, "eval_accuracy": 0.8502994011976048, "eval_loss": 0.3946226239204407, "eval_runtime": 4.3743, "eval_samples_per_second": 76.354, "eval_steps_per_second": 9.601, "step": 672 }, { "epoch": 43.0, "eval_accuracy": 0.8473053892215568, "eval_loss": 0.39317673444747925, "eval_runtime": 4.3247, "eval_samples_per_second": 77.23, "eval_steps_per_second": 9.712, "step": 688 }, { "epoch": 44.0, "eval_accuracy": 0.8473053892215568, "eval_loss": 0.389418363571167, "eval_runtime": 4.4405, "eval_samples_per_second": 75.216, "eval_steps_per_second": 9.458, "step": 704 }, { "epoch": 45.0, "eval_accuracy": 0.8473053892215568, "eval_loss": 0.3862323462963104, "eval_runtime": 4.3815, "eval_samples_per_second": 76.23, "eval_steps_per_second": 9.586, "step": 720 }, { "epoch": 46.0, "eval_accuracy": 0.8502994011976048, "eval_loss": 0.384316086769104, "eval_runtime": 4.4286, "eval_samples_per_second": 75.42, "eval_steps_per_second": 9.484, "step": 736 }, { "epoch": 47.0, "eval_accuracy": 0.844311377245509, "eval_loss": 0.383512943983078, "eval_runtime": 4.4251, "eval_samples_per_second": 75.479, "eval_steps_per_second": 9.491, "step": 752 }, { "epoch": 48.0, "eval_accuracy": 0.8622754491017964, "eval_loss": 0.3795510232448578, "eval_runtime": 4.4626, "eval_samples_per_second": 74.844, "eval_steps_per_second": 9.412, "step": 768 }, { "epoch": 49.0, "eval_accuracy": 0.8592814371257484, "eval_loss": 0.3759188950061798, "eval_runtime": 4.3421, "eval_samples_per_second": 76.921, "eval_steps_per_second": 9.673, "step": 784 }, { "epoch": 50.0, "eval_accuracy": 0.8652694610778443, "eval_loss": 0.37549516558647156, "eval_runtime": 4.4076, "eval_samples_per_second": 75.778, "eval_steps_per_second": 9.529, "step": 800 }, { "epoch": 51.0, "eval_accuracy": 0.8622754491017964, "eval_loss": 0.3745565414428711, "eval_runtime": 4.466, "eval_samples_per_second": 74.787, "eval_steps_per_second": 9.404, "step": 816 }, { "epoch": 52.0, "eval_accuracy": 0.8652694610778443, "eval_loss": 0.37246376276016235, "eval_runtime": 4.3519, "eval_samples_per_second": 76.748, "eval_steps_per_second": 9.651, "step": 832 }, { "epoch": 53.0, "eval_accuracy": 0.8652694610778443, "eval_loss": 0.36974743008613586, "eval_runtime": 4.4116, "eval_samples_per_second": 75.709, "eval_steps_per_second": 9.52, "step": 848 }, { "epoch": 54.0, "eval_accuracy": 0.874251497005988, "eval_loss": 0.3688933253288269, "eval_runtime": 4.373, "eval_samples_per_second": 76.377, "eval_steps_per_second": 9.604, "step": 864 }, { "epoch": 55.0, "eval_accuracy": 0.874251497005988, "eval_loss": 0.3665659427642822, "eval_runtime": 4.3847, "eval_samples_per_second": 76.173, "eval_steps_per_second": 9.579, "step": 880 }, { "epoch": 56.0, "eval_accuracy": 0.874251497005988, "eval_loss": 0.3666609227657318, "eval_runtime": 4.4937, "eval_samples_per_second": 74.326, "eval_steps_per_second": 9.346, "step": 896 }, { "epoch": 57.0, "eval_accuracy": 0.8802395209580839, "eval_loss": 0.366781622171402, "eval_runtime": 4.4056, "eval_samples_per_second": 75.812, "eval_steps_per_second": 9.533, "step": 912 }, { "epoch": 58.0, "eval_accuracy": 0.8802395209580839, "eval_loss": 0.3661949932575226, "eval_runtime": 4.4335, "eval_samples_per_second": 75.336, "eval_steps_per_second": 9.473, "step": 928 }, { "epoch": 59.0, "eval_accuracy": 0.8802395209580839, "eval_loss": 0.36339056491851807, "eval_runtime": 4.4117, "eval_samples_per_second": 75.708, "eval_steps_per_second": 9.52, "step": 944 }, { "epoch": 60.0, "eval_accuracy": 0.8772455089820359, "eval_loss": 0.36299723386764526, "eval_runtime": 4.4436, "eval_samples_per_second": 75.165, "eval_steps_per_second": 9.452, "step": 960 }, { "epoch": 61.0, "eval_accuracy": 0.8832335329341318, "eval_loss": 0.3644971549510956, "eval_runtime": 4.3789, "eval_samples_per_second": 76.274, "eval_steps_per_second": 9.591, "step": 976 }, { "epoch": 62.0, "eval_accuracy": 0.8832335329341318, "eval_loss": 0.3652717173099518, "eval_runtime": 4.3124, "eval_samples_per_second": 77.452, "eval_steps_per_second": 9.739, "step": 992 }, { "epoch": 62.5, "grad_norm": 1.597828984260559, "learning_rate": 5.984784446322908e-07, "loss": 0.1919, "step": 1000 }, { "epoch": 63.0, "eval_accuracy": 0.8832335329341318, "eval_loss": 0.3627488911151886, "eval_runtime": 4.4759, "eval_samples_per_second": 74.622, "eval_steps_per_second": 9.384, "step": 1008 }, { "epoch": 64.0, "eval_accuracy": 0.8772455089820359, "eval_loss": 0.3642951548099518, "eval_runtime": 4.4875, "eval_samples_per_second": 74.428, "eval_steps_per_second": 9.359, "step": 1024 }, { "epoch": 65.0, "eval_accuracy": 0.874251497005988, "eval_loss": 0.3665095567703247, "eval_runtime": 4.39, "eval_samples_per_second": 76.083, "eval_steps_per_second": 9.567, "step": 1040 }, { "epoch": 66.0, "eval_accuracy": 0.8772455089820359, "eval_loss": 0.3633537292480469, "eval_runtime": 4.4453, "eval_samples_per_second": 75.135, "eval_steps_per_second": 9.448, "step": 1056 }, { "epoch": 67.0, "eval_accuracy": 0.8772455089820359, "eval_loss": 0.36282193660736084, "eval_runtime": 4.4608, "eval_samples_per_second": 74.875, "eval_steps_per_second": 9.415, "step": 1072 }, { "epoch": 68.0, "eval_accuracy": 0.874251497005988, "eval_loss": 0.36409279704093933, "eval_runtime": 4.3878, "eval_samples_per_second": 76.119, "eval_steps_per_second": 9.572, "step": 1088 }, { "epoch": 69.0, "eval_accuracy": 0.8772455089820359, "eval_loss": 0.3623464107513428, "eval_runtime": 4.4706, "eval_samples_per_second": 74.711, "eval_steps_per_second": 9.395, "step": 1104 }, { "epoch": 70.0, "eval_accuracy": 0.8772455089820359, "eval_loss": 0.35881221294403076, "eval_runtime": 4.3641, "eval_samples_per_second": 76.533, "eval_steps_per_second": 9.624, "step": 1120 } ], "logging_steps": 500, "max_steps": 2416, "num_input_tokens_seen": 0, "num_train_epochs": 151, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 2.71221963651072e+18, "train_batch_size": 32, "trial_name": null, "trial_params": null }