{ "best_metric": 0.6739130434782609, "best_model_checkpoint": "swinv2-tiny-patch4-window8-256-DMAE-3e-5\\checkpoint-94", "epoch": 34.285714285714285, "eval_steps": 500, "global_step": 120, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.86, "eval_accuracy": 0.10869565217391304, "eval_loss": 1.6337018013000488, "eval_runtime": 0.8832, "eval_samples_per_second": 52.083, "eval_steps_per_second": 3.397, "step": 3 }, { "epoch": 2.0, "eval_accuracy": 0.10869565217391304, "eval_loss": 1.622289776802063, "eval_runtime": 0.9452, "eval_samples_per_second": 48.666, "eval_steps_per_second": 3.174, "step": 7 }, { "epoch": 2.86, "learning_rate": 2.5e-05, "loss": 1.6298, "step": 10 }, { "epoch": 2.86, "eval_accuracy": 0.10869565217391304, "eval_loss": 1.5971730947494507, "eval_runtime": 0.6641, "eval_samples_per_second": 69.268, "eval_steps_per_second": 4.517, "step": 10 }, { "epoch": 4.0, "eval_accuracy": 0.10869565217391304, "eval_loss": 1.5040873289108276, "eval_runtime": 0.7672, "eval_samples_per_second": 59.96, "eval_steps_per_second": 3.91, "step": 14 }, { "epoch": 4.86, "eval_accuracy": 0.10869565217391304, "eval_loss": 1.4149224758148193, "eval_runtime": 0.8815, "eval_samples_per_second": 52.182, "eval_steps_per_second": 3.403, "step": 17 }, { "epoch": 5.71, "learning_rate": 2.777777777777778e-05, "loss": 1.4858, "step": 20 }, { "epoch": 6.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.3036504983901978, "eval_runtime": 0.6381, "eval_samples_per_second": 72.084, "eval_steps_per_second": 4.701, "step": 21 }, { "epoch": 6.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2491180896759033, "eval_runtime": 0.6833, "eval_samples_per_second": 67.325, "eval_steps_per_second": 4.391, "step": 24 }, { "epoch": 8.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2219406366348267, "eval_runtime": 0.6631, "eval_samples_per_second": 69.366, "eval_steps_per_second": 4.524, "step": 28 }, { "epoch": 8.57, "learning_rate": 2.5e-05, "loss": 1.2337, "step": 30 }, { "epoch": 8.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2146371603012085, "eval_runtime": 0.6597, "eval_samples_per_second": 69.732, "eval_steps_per_second": 4.548, "step": 31 }, { "epoch": 10.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.214502215385437, "eval_runtime": 0.6581, "eval_samples_per_second": 69.893, "eval_steps_per_second": 4.558, "step": 35 }, { "epoch": 10.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.211630940437317, "eval_runtime": 0.6381, "eval_samples_per_second": 72.083, "eval_steps_per_second": 4.701, "step": 38 }, { "epoch": 11.43, "learning_rate": 2.222222222222222e-05, "loss": 1.1726, "step": 40 }, { "epoch": 12.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2064777612686157, "eval_runtime": 0.6501, "eval_samples_per_second": 70.753, "eval_steps_per_second": 4.614, "step": 42 }, { "epoch": 12.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.201141357421875, "eval_runtime": 0.6601, "eval_samples_per_second": 69.681, "eval_steps_per_second": 4.544, "step": 45 }, { "epoch": 14.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.1940866708755493, "eval_runtime": 0.6627, "eval_samples_per_second": 69.413, "eval_steps_per_second": 4.527, "step": 49 }, { "epoch": 14.29, "learning_rate": 1.9444444444444445e-05, "loss": 1.1953, "step": 50 }, { "epoch": 14.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.18779456615448, "eval_runtime": 0.695, "eval_samples_per_second": 66.19, "eval_steps_per_second": 4.317, "step": 52 }, { "epoch": 16.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.1770756244659424, "eval_runtime": 0.6902, "eval_samples_per_second": 66.652, "eval_steps_per_second": 4.347, "step": 56 }, { "epoch": 16.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.1677342653274536, "eval_runtime": 0.6555, "eval_samples_per_second": 70.174, "eval_steps_per_second": 4.577, "step": 59 }, { "epoch": 17.14, "learning_rate": 1.6666666666666667e-05, "loss": 1.1602, "step": 60 }, { "epoch": 18.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.1564418077468872, "eval_runtime": 0.6792, "eval_samples_per_second": 67.731, "eval_steps_per_second": 4.417, "step": 63 }, { "epoch": 18.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.1501902341842651, "eval_runtime": 0.6591, "eval_samples_per_second": 69.795, "eval_steps_per_second": 4.552, "step": 66 }, { "epoch": 20.0, "learning_rate": 1.388888888888889e-05, "loss": 1.1415, "step": 70 }, { "epoch": 20.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.1226557493209839, "eval_runtime": 0.6682, "eval_samples_per_second": 68.846, "eval_steps_per_second": 4.49, "step": 70 }, { "epoch": 20.86, "eval_accuracy": 0.4782608695652174, "eval_loss": 1.101697564125061, "eval_runtime": 0.6411, "eval_samples_per_second": 71.747, "eval_steps_per_second": 4.679, "step": 73 }, { "epoch": 22.0, "eval_accuracy": 0.5869565217391305, "eval_loss": 1.0871663093566895, "eval_runtime": 0.6591, "eval_samples_per_second": 69.787, "eval_steps_per_second": 4.551, "step": 77 }, { "epoch": 22.86, "learning_rate": 1.111111111111111e-05, "loss": 1.0949, "step": 80 }, { "epoch": 22.86, "eval_accuracy": 0.5869565217391305, "eval_loss": 1.0795304775238037, "eval_runtime": 0.6621, "eval_samples_per_second": 69.471, "eval_steps_per_second": 4.531, "step": 80 }, { "epoch": 24.0, "eval_accuracy": 0.6086956521739131, "eval_loss": 1.0581977367401123, "eval_runtime": 0.6631, "eval_samples_per_second": 69.366, "eval_steps_per_second": 4.524, "step": 84 }, { "epoch": 24.86, "eval_accuracy": 0.6086956521739131, "eval_loss": 1.0401618480682373, "eval_runtime": 0.7072, "eval_samples_per_second": 65.047, "eval_steps_per_second": 4.242, "step": 87 }, { "epoch": 25.71, "learning_rate": 8.333333333333334e-06, "loss": 1.0559, "step": 90 }, { "epoch": 26.0, "eval_accuracy": 0.6521739130434783, "eval_loss": 1.0186063051223755, "eval_runtime": 0.6467, "eval_samples_per_second": 71.135, "eval_steps_per_second": 4.639, "step": 91 }, { "epoch": 26.86, "eval_accuracy": 0.6739130434782609, "eval_loss": 1.01261305809021, "eval_runtime": 0.6762, "eval_samples_per_second": 68.031, "eval_steps_per_second": 4.437, "step": 94 }, { "epoch": 28.0, "eval_accuracy": 0.6739130434782609, "eval_loss": 1.0032662153244019, "eval_runtime": 0.6702, "eval_samples_per_second": 68.639, "eval_steps_per_second": 4.476, "step": 98 }, { "epoch": 28.57, "learning_rate": 5.555555555555555e-06, "loss": 1.0423, "step": 100 }, { "epoch": 28.86, "eval_accuracy": 0.6739130434782609, "eval_loss": 0.9848656058311462, "eval_runtime": 0.6762, "eval_samples_per_second": 68.029, "eval_steps_per_second": 4.437, "step": 101 }, { "epoch": 30.0, "eval_accuracy": 0.6739130434782609, "eval_loss": 0.9669570922851562, "eval_runtime": 0.6637, "eval_samples_per_second": 69.314, "eval_steps_per_second": 4.52, "step": 105 }, { "epoch": 30.86, "eval_accuracy": 0.6739130434782609, "eval_loss": 0.9630699753761292, "eval_runtime": 0.8147, "eval_samples_per_second": 56.462, "eval_steps_per_second": 3.682, "step": 108 }, { "epoch": 31.43, "learning_rate": 2.7777777777777775e-06, "loss": 1.0002, "step": 110 }, { "epoch": 32.0, "eval_accuracy": 0.6521739130434783, "eval_loss": 0.9599204659461975, "eval_runtime": 0.6631, "eval_samples_per_second": 69.366, "eval_steps_per_second": 4.524, "step": 112 }, { "epoch": 32.86, "eval_accuracy": 0.6521739130434783, "eval_loss": 0.9586823582649231, "eval_runtime": 0.6661, "eval_samples_per_second": 69.054, "eval_steps_per_second": 4.503, "step": 115 }, { "epoch": 34.0, "eval_accuracy": 0.6521739130434783, "eval_loss": 0.9573362469673157, "eval_runtime": 0.6584, "eval_samples_per_second": 69.871, "eval_steps_per_second": 4.557, "step": 119 }, { "epoch": 34.29, "learning_rate": 0.0, "loss": 1.0077, "step": 120 }, { "epoch": 34.29, "eval_accuracy": 0.6521739130434783, "eval_loss": 0.9570884704589844, "eval_runtime": 0.6737, "eval_samples_per_second": 68.281, "eval_steps_per_second": 4.453, "step": 120 }, { "epoch": 34.29, "step": 120, "total_flos": 2.3770905934823424e+17, "train_loss": 1.18499755859375, "train_runtime": 199.3828, "train_samples_per_second": 42.732, "train_steps_per_second": 0.602 } ], "logging_steps": 10, "max_steps": 120, "num_input_tokens_seen": 0, "num_train_epochs": 40, "save_steps": 500, "total_flos": 2.3770905934823424e+17, "train_batch_size": 16, "trial_name": null, "trial_params": null }