{ "best_metric": 0.45652173913043476, "best_model_checkpoint": "swinv2-tiny-patch4-window8-256-DMAE-5e-2\\checkpoint-10", "epoch": 34.285714285714285, "eval_steps": 500, "global_step": 120, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.86, "eval_accuracy": 0.32608695652173914, "eval_loss": 22.410741806030273, "eval_runtime": 0.7553, "eval_samples_per_second": 60.901, "eval_steps_per_second": 3.972, "step": 3 }, { "epoch": 2.0, "eval_accuracy": 0.32608695652173914, "eval_loss": 11.26321792602539, "eval_runtime": 0.7728, "eval_samples_per_second": 59.527, "eval_steps_per_second": 3.882, "step": 7 }, { "epoch": 2.86, "learning_rate": 0.04583333333333334, "loss": 15.4384, "step": 10 }, { "epoch": 2.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 8.339312553405762, "eval_runtime": 0.7917, "eval_samples_per_second": 58.104, "eval_steps_per_second": 3.789, "step": 10 }, { "epoch": 4.0, "eval_accuracy": 0.10869565217391304, "eval_loss": 2.280815839767456, "eval_runtime": 0.7452, "eval_samples_per_second": 61.731, "eval_steps_per_second": 4.026, "step": 14 }, { "epoch": 4.86, "eval_accuracy": 0.32608695652173914, "eval_loss": 2.978447198867798, "eval_runtime": 0.7387, "eval_samples_per_second": 62.273, "eval_steps_per_second": 4.061, "step": 17 }, { "epoch": 5.71, "learning_rate": 0.04166666666666667, "loss": 4.9288, "step": 20 }, { "epoch": 6.0, "eval_accuracy": 0.32608695652173914, "eval_loss": 2.475663900375366, "eval_runtime": 0.7452, "eval_samples_per_second": 61.731, "eval_steps_per_second": 4.026, "step": 21 }, { "epoch": 6.86, "eval_accuracy": 0.10869565217391304, "eval_loss": 2.5933523178100586, "eval_runtime": 0.7372, "eval_samples_per_second": 62.399, "eval_steps_per_second": 4.07, "step": 24 }, { "epoch": 8.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 2.3187241554260254, "eval_runtime": 0.7272, "eval_samples_per_second": 63.258, "eval_steps_per_second": 4.126, "step": 28 }, { "epoch": 8.57, "learning_rate": 0.037500000000000006, "loss": 2.426, "step": 30 }, { "epoch": 8.86, "eval_accuracy": 0.32608695652173914, "eval_loss": 1.7270220518112183, "eval_runtime": 0.7982, "eval_samples_per_second": 57.631, "eval_steps_per_second": 3.759, "step": 31 }, { "epoch": 10.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.4868004322052002, "eval_runtime": 0.7112, "eval_samples_per_second": 64.683, "eval_steps_per_second": 4.218, "step": 35 }, { "epoch": 10.86, "eval_accuracy": 0.32608695652173914, "eval_loss": 1.3056219816207886, "eval_runtime": 0.7972, "eval_samples_per_second": 57.704, "eval_steps_per_second": 3.763, "step": 38 }, { "epoch": 11.43, "learning_rate": 0.03333333333333333, "loss": 1.5653, "step": 40 }, { "epoch": 12.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2236616611480713, "eval_runtime": 0.7612, "eval_samples_per_second": 60.433, "eval_steps_per_second": 3.941, "step": 42 }, { "epoch": 12.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.4644097089767456, "eval_runtime": 0.7272, "eval_samples_per_second": 63.26, "eval_steps_per_second": 4.126, "step": 45 }, { "epoch": 14.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2427252531051636, "eval_runtime": 0.7122, "eval_samples_per_second": 64.592, "eval_steps_per_second": 4.213, "step": 49 }, { "epoch": 14.29, "learning_rate": 0.02916666666666667, "loss": 1.4578, "step": 50 }, { "epoch": 14.86, "eval_accuracy": 0.32608695652173914, "eval_loss": 1.247389554977417, "eval_runtime": 0.7527, "eval_samples_per_second": 61.115, "eval_steps_per_second": 3.986, "step": 52 }, { "epoch": 16.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.3440945148468018, "eval_runtime": 0.7337, "eval_samples_per_second": 62.698, "eval_steps_per_second": 4.089, "step": 56 }, { "epoch": 16.86, "eval_accuracy": 0.32608695652173914, "eval_loss": 1.3480498790740967, "eval_runtime": 0.8027, "eval_samples_per_second": 57.306, "eval_steps_per_second": 3.737, "step": 59 }, { "epoch": 17.14, "learning_rate": 0.025, "loss": 1.3492, "step": 60 }, { "epoch": 18.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2835181951522827, "eval_runtime": 0.7937, "eval_samples_per_second": 57.957, "eval_steps_per_second": 3.78, "step": 63 }, { "epoch": 18.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.3153202533721924, "eval_runtime": 0.7487, "eval_samples_per_second": 61.442, "eval_steps_per_second": 4.007, "step": 66 }, { "epoch": 20.0, "learning_rate": 0.020833333333333336, "loss": 1.3089, "step": 70 }, { "epoch": 20.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2387202978134155, "eval_runtime": 0.8447, "eval_samples_per_second": 54.457, "eval_steps_per_second": 3.552, "step": 70 }, { "epoch": 20.86, "eval_accuracy": 0.32608695652173914, "eval_loss": 1.2538148164749146, "eval_runtime": 0.7427, "eval_samples_per_second": 61.938, "eval_steps_per_second": 4.039, "step": 73 }, { "epoch": 22.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2386040687561035, "eval_runtime": 0.8212, "eval_samples_per_second": 56.017, "eval_steps_per_second": 3.653, "step": 77 }, { "epoch": 22.86, "learning_rate": 0.016666666666666666, "loss": 1.2345, "step": 80 }, { "epoch": 22.86, "eval_accuracy": 0.32608695652173914, "eval_loss": 1.261245608329773, "eval_runtime": 0.8717, "eval_samples_per_second": 52.77, "eval_steps_per_second": 3.442, "step": 80 }, { "epoch": 24.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2124842405319214, "eval_runtime": 0.8932, "eval_samples_per_second": 51.5, "eval_steps_per_second": 3.359, "step": 84 }, { "epoch": 24.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2078908681869507, "eval_runtime": 0.7602, "eval_samples_per_second": 60.513, "eval_steps_per_second": 3.946, "step": 87 }, { "epoch": 25.71, "learning_rate": 0.0125, "loss": 1.2105, "step": 90 }, { "epoch": 26.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2138991355895996, "eval_runtime": 0.7567, "eval_samples_per_second": 60.792, "eval_steps_per_second": 3.965, "step": 91 }, { "epoch": 26.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2171320915222168, "eval_runtime": 0.8692, "eval_samples_per_second": 52.921, "eval_steps_per_second": 3.451, "step": 94 }, { "epoch": 28.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.218336820602417, "eval_runtime": 0.8997, "eval_samples_per_second": 51.128, "eval_steps_per_second": 3.334, "step": 98 }, { "epoch": 28.57, "learning_rate": 0.008333333333333333, "loss": 1.2095, "step": 100 }, { "epoch": 28.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2093594074249268, "eval_runtime": 0.7922, "eval_samples_per_second": 58.066, "eval_steps_per_second": 3.787, "step": 101 }, { "epoch": 30.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.206130862236023, "eval_runtime": 0.8217, "eval_samples_per_second": 55.981, "eval_steps_per_second": 3.651, "step": 105 }, { "epoch": 30.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2068984508514404, "eval_runtime": 0.7457, "eval_samples_per_second": 61.688, "eval_steps_per_second": 4.023, "step": 108 }, { "epoch": 31.43, "learning_rate": 0.004166666666666667, "loss": 1.203, "step": 110 }, { "epoch": 32.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2073019742965698, "eval_runtime": 0.7547, "eval_samples_per_second": 60.953, "eval_steps_per_second": 3.975, "step": 112 }, { "epoch": 32.86, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.207156777381897, "eval_runtime": 0.8097, "eval_samples_per_second": 56.811, "eval_steps_per_second": 3.705, "step": 115 }, { "epoch": 34.0, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2066789865493774, "eval_runtime": 0.7932, "eval_samples_per_second": 57.993, "eval_steps_per_second": 3.782, "step": 119 }, { "epoch": 34.29, "learning_rate": 0.0, "loss": 1.1996, "step": 120 }, { "epoch": 34.29, "eval_accuracy": 0.45652173913043476, "eval_loss": 1.2066394090652466, "eval_runtime": 0.7892, "eval_samples_per_second": 58.289, "eval_steps_per_second": 3.801, "step": 120 }, { "epoch": 34.29, "step": 120, "total_flos": 2.3770905934823424e+17, "train_loss": 2.8776248772939046, "train_runtime": 206.7662, "train_samples_per_second": 41.206, "train_steps_per_second": 0.58 } ], "logging_steps": 10, "max_steps": 120, "num_input_tokens_seen": 0, "num_train_epochs": 40, "save_steps": 500, "total_flos": 2.3770905934823424e+17, "train_batch_size": 16, "trial_name": null, "trial_params": null }