{ "best_metric": 0.45652173913043476, "best_model_checkpoint": "swinv2-tiny-patch4-window8-256-DMAE-U3\\checkpoint-42", "epoch": 34.285714285714285, "eval_steps": 500, "global_step": 120, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.86, "eval_accuracy": 0.10869565217391304, "eval_loss": 7.932784557342529, "eval_runtime": 0.7282, "eval_samples_per_second": 63.171, "eval_steps_per_second": 4.12, "step": 3 }, { "epoch": 2.0, "eval_accuracy": 0.10869565217391304, "eval_loss": 7.759629726409912, "eval_runtime": 0.8117, "eval_samples_per_second": 56.672, "eval_steps_per_second": 3.696, "step": 7 }, { "epoch": 2.86, "learning_rate": 5.3070175438596496e-05, "loss": 7.8559, "step": 10 }, { "epoch": 2.86, "eval_accuracy": 0.10869565217391304, "eval_loss": 7.324063301086426, "eval_runtime": 0.7392, "eval_samples_per_second": 62.232, "eval_steps_per_second": 4.059, "step": 10 }, { "epoch": 4.0, "eval_accuracy": 0.10869565217391304, "eval_loss": 6.445021152496338, "eval_runtime": 0.7442, "eval_samples_per_second": 61.814, "eval_steps_per_second": 4.031, "step": 14 }, { "epoch": 4.86, "eval_accuracy": 0.10869565217391304, "eval_loss": 5.772275924682617, "eval_runtime": 0.7442, "eval_samples_per_second": 61.814, "eval_steps_per_second": 4.031, "step": 17 }, { "epoch": 5.71, "learning_rate": 4.824561403508772e-05, "loss": 6.3363, "step": 20 }, { "epoch": 6.0, "eval_accuracy": 0.10869565217391304, "eval_loss": 4.877190113067627, "eval_runtime": 0.7352, "eval_samples_per_second": 62.57, "eval_steps_per_second": 4.081, "step": 21 }, { "epoch": 6.86, "eval_accuracy": 0.10869565217391304, "eval_loss": 4.267832279205322, "eval_runtime": 0.7272, "eval_samples_per_second": 63.258, "eval_steps_per_second": 4.126, "step": 24 }, { "epoch": 8.0, "eval_accuracy": 0.10869565217391304, "eval_loss": 3.500047445297241, "eval_runtime": 0.7392, "eval_samples_per_second": 62.231, "eval_steps_per_second": 4.059, "step": 28 }, { "epoch": 8.57, "learning_rate": 4.342105263157895e-05, "loss": 4.1887, "step": 30 }, { "epoch": 8.86, "eval_accuracy": 0.10869565217391304, "eval_loss": 2.9766128063201904, "eval_runtime": 0.7322, "eval_samples_per_second": 62.827, "eval_steps_per_second": 4.097, "step": 31 }, { "epoch": 10.0, "eval_accuracy": 0.10869565217391304, "eval_loss": 2.387573003768921, "eval_runtime": 0.7862, "eval_samples_per_second": 58.511, "eval_steps_per_second": 3.816, "step": 35 }, { "epoch": 10.86, "eval_accuracy": 0.10869565217391304, "eval_loss": 2.0428757667541504, "eval_runtime": 0.7689, "eval_samples_per_second": 59.823, "eval_steps_per_second": 3.902, "step": 38 }, { "epoch": 11.43, "learning_rate": 3.859649122807018e-05, "loss": 2.602, "step": 40 }, { "epoch": 12.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.7136485576629639, "eval_runtime": 0.7451, "eval_samples_per_second": 61.733, "eval_steps_per_second": 4.026, "step": 42 }, { "epoch": 12.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.547783374786377, "eval_runtime": 0.7662, "eval_samples_per_second": 60.038, "eval_steps_per_second": 3.916, "step": 45 }, { "epoch": 14.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.3874478340148926, "eval_runtime": 0.8637, "eval_samples_per_second": 53.259, "eval_steps_per_second": 3.473, "step": 49 }, { "epoch": 14.29, "learning_rate": 3.377192982456141e-05, "loss": 1.6353, "step": 50 }, { "epoch": 14.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.296812653541565, "eval_runtime": 0.8092, "eval_samples_per_second": 56.848, "eval_steps_per_second": 3.707, "step": 52 }, { "epoch": 16.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2225128412246704, "eval_runtime": 0.7957, "eval_samples_per_second": 57.812, "eval_steps_per_second": 3.77, "step": 56 }, { "epoch": 16.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2070940732955933, "eval_runtime": 0.7367, "eval_samples_per_second": 62.443, "eval_steps_per_second": 4.072, "step": 59 }, { "epoch": 17.14, "learning_rate": 2.894736842105263e-05, "loss": 1.2533, "step": 60 }, { "epoch": 18.0, "eval_accuracy": 0.32608695652173914, "eval_loss": 1.2176765203475952, "eval_runtime": 0.7782, "eval_samples_per_second": 59.111, "eval_steps_per_second": 3.855, "step": 63 }, { "epoch": 18.86, "eval_accuracy": 0.32608695652173914, "eval_loss": 1.2196648120880127, "eval_runtime": 0.8362, "eval_samples_per_second": 55.012, "eval_steps_per_second": 3.588, "step": 66 }, { "epoch": 20.0, "learning_rate": 2.412280701754386e-05, "loss": 1.2088, "step": 70 }, { "epoch": 20.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.211230754852295, "eval_runtime": 0.8632, "eval_samples_per_second": 53.29, "eval_steps_per_second": 3.475, "step": 70 }, { "epoch": 20.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.210147738456726, "eval_runtime": 0.7454, "eval_samples_per_second": 61.711, "eval_steps_per_second": 4.025, "step": 73 }, { "epoch": 22.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2092347145080566, "eval_runtime": 0.7592, "eval_samples_per_second": 60.592, "eval_steps_per_second": 3.952, "step": 77 }, { "epoch": 22.86, "learning_rate": 1.929824561403509e-05, "loss": 1.1798, "step": 80 }, { "epoch": 22.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2081409692764282, "eval_runtime": 0.9141, "eval_samples_per_second": 50.323, "eval_steps_per_second": 3.282, "step": 80 }, { "epoch": 24.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2076103687286377, "eval_runtime": 0.7367, "eval_samples_per_second": 62.44, "eval_steps_per_second": 4.072, "step": 84 }, { "epoch": 24.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2048611640930176, "eval_runtime": 0.7435, "eval_samples_per_second": 61.867, "eval_steps_per_second": 4.035, "step": 87 }, { "epoch": 25.71, "learning_rate": 1.4473684210526315e-05, "loss": 1.1825, "step": 90 }, { "epoch": 26.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2044618129730225, "eval_runtime": 0.8012, "eval_samples_per_second": 57.414, "eval_steps_per_second": 3.744, "step": 91 }, { "epoch": 26.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2028782367706299, "eval_runtime": 0.7207, "eval_samples_per_second": 63.83, "eval_steps_per_second": 4.163, "step": 94 }, { "epoch": 28.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2022422552108765, "eval_runtime": 0.7542, "eval_samples_per_second": 60.994, "eval_steps_per_second": 3.978, "step": 98 }, { "epoch": 28.57, "learning_rate": 9.649122807017545e-06, "loss": 1.1943, "step": 100 }, { "epoch": 28.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2013744115829468, "eval_runtime": 0.7562, "eval_samples_per_second": 60.833, "eval_steps_per_second": 3.967, "step": 101 }, { "epoch": 30.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2039952278137207, "eval_runtime": 0.7452, "eval_samples_per_second": 61.731, "eval_steps_per_second": 4.026, "step": 105 }, { "epoch": 30.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2050013542175293, "eval_runtime": 0.7652, "eval_samples_per_second": 60.117, "eval_steps_per_second": 3.921, "step": 108 }, { "epoch": 31.43, "learning_rate": 4.824561403508772e-06, "loss": 1.1772, "step": 110 }, { "epoch": 32.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2031123638153076, "eval_runtime": 0.7692, "eval_samples_per_second": 59.805, "eval_steps_per_second": 3.9, "step": 112 }, { "epoch": 32.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.201911449432373, "eval_runtime": 0.7212, "eval_samples_per_second": 63.786, "eval_steps_per_second": 4.16, "step": 115 }, { "epoch": 34.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2012614011764526, "eval_runtime": 0.7902, "eval_samples_per_second": 58.214, "eval_steps_per_second": 3.797, "step": 119 }, { "epoch": 34.29, "learning_rate": 0.0, "loss": 1.1945, "step": 120 }, { "epoch": 34.29, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.201164960861206, "eval_runtime": 0.7465, "eval_samples_per_second": 61.619, "eval_steps_per_second": 4.019, "step": 120 }, { "epoch": 34.29, "step": 120, "total_flos": 2.3770905934823424e+17, "train_loss": 2.584045958518982, "train_runtime": 203.0479, "train_samples_per_second": 41.961, "train_steps_per_second": 0.591 } ], "logging_steps": 10, "max_steps": 120, "num_input_tokens_seen": 0, "num_train_epochs": 40, "save_steps": 500, "total_flos": 2.3770905934823424e+17, "train_batch_size": 16, "trial_name": null, "trial_params": null }