| { |
| "best_metric": 0.7307692307692307, |
| "best_model_checkpoint": "swinv2-tiny-patch4-window8-256-dmae-humeda-DAV56/checkpoint-128", |
| "epoch": 44.8421052631579, |
| "eval_steps": 500, |
| "global_step": 180, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.8421052631578947, |
| "eval_accuracy": 0.3269230769230769, |
| "eval_loss": 1.5618427991867065, |
| "eval_runtime": 0.8649, |
| "eval_samples_per_second": 60.123, |
| "eval_steps_per_second": 2.312, |
| "step": 4 |
| }, |
| { |
| "epoch": 1.8421052631578947, |
| "eval_accuracy": 0.4423076923076923, |
| "eval_loss": 1.5395886898040771, |
| "eval_runtime": 0.8206, |
| "eval_samples_per_second": 63.366, |
| "eval_steps_per_second": 2.437, |
| "step": 8 |
| }, |
| { |
| "epoch": 2.8421052631578947, |
| "grad_norm": 3.157193660736084, |
| "learning_rate": 1.3333333333333333e-05, |
| "loss": 1.7209, |
| "step": 12 |
| }, |
| { |
| "epoch": 2.8421052631578947, |
| "eval_accuracy": 0.3076923076923077, |
| "eval_loss": 1.5123951435089111, |
| "eval_runtime": 0.8398, |
| "eval_samples_per_second": 61.921, |
| "eval_steps_per_second": 2.382, |
| "step": 12 |
| }, |
| { |
| "epoch": 3.8421052631578947, |
| "eval_accuracy": 0.3269230769230769, |
| "eval_loss": 1.4679234027862549, |
| "eval_runtime": 1.2246, |
| "eval_samples_per_second": 42.462, |
| "eval_steps_per_second": 1.633, |
| "step": 16 |
| }, |
| { |
| "epoch": 4.842105263157895, |
| "eval_accuracy": 0.34615384615384615, |
| "eval_loss": 1.412973165512085, |
| "eval_runtime": 0.8428, |
| "eval_samples_per_second": 61.701, |
| "eval_steps_per_second": 2.373, |
| "step": 20 |
| }, |
| { |
| "epoch": 5.842105263157895, |
| "grad_norm": 4.583027362823486, |
| "learning_rate": 1.9932383577419432e-05, |
| "loss": 1.5864, |
| "step": 24 |
| }, |
| { |
| "epoch": 5.842105263157895, |
| "eval_accuracy": 0.5384615384615384, |
| "eval_loss": 1.31065034866333, |
| "eval_runtime": 0.8266, |
| "eval_samples_per_second": 62.908, |
| "eval_steps_per_second": 2.42, |
| "step": 24 |
| }, |
| { |
| "epoch": 6.842105263157895, |
| "eval_accuracy": 0.5384615384615384, |
| "eval_loss": 1.2111910581588745, |
| "eval_runtime": 0.8228, |
| "eval_samples_per_second": 63.201, |
| "eval_steps_per_second": 2.431, |
| "step": 28 |
| }, |
| { |
| "epoch": 7.842105263157895, |
| "eval_accuracy": 0.5961538461538461, |
| "eval_loss": 1.119398832321167, |
| "eval_runtime": 0.8365, |
| "eval_samples_per_second": 62.162, |
| "eval_steps_per_second": 2.391, |
| "step": 32 |
| }, |
| { |
| "epoch": 8.842105263157894, |
| "grad_norm": 5.296598434448242, |
| "learning_rate": 1.9396926207859085e-05, |
| "loss": 1.2629, |
| "step": 36 |
| }, |
| { |
| "epoch": 8.842105263157894, |
| "eval_accuracy": 0.5961538461538461, |
| "eval_loss": 1.0421706438064575, |
| "eval_runtime": 1.1444, |
| "eval_samples_per_second": 45.439, |
| "eval_steps_per_second": 1.748, |
| "step": 36 |
| }, |
| { |
| "epoch": 9.842105263157894, |
| "eval_accuracy": 0.6538461538461539, |
| "eval_loss": 0.9705998301506042, |
| "eval_runtime": 1.1966, |
| "eval_samples_per_second": 43.458, |
| "eval_steps_per_second": 1.671, |
| "step": 40 |
| }, |
| { |
| "epoch": 10.842105263157894, |
| "eval_accuracy": 0.6538461538461539, |
| "eval_loss": 0.9637848734855652, |
| "eval_runtime": 0.8287, |
| "eval_samples_per_second": 62.751, |
| "eval_steps_per_second": 2.414, |
| "step": 44 |
| }, |
| { |
| "epoch": 11.842105263157894, |
| "grad_norm": 8.424572944641113, |
| "learning_rate": 1.8354878114129368e-05, |
| "loss": 0.951, |
| "step": 48 |
| }, |
| { |
| "epoch": 11.842105263157894, |
| "eval_accuracy": 0.6153846153846154, |
| "eval_loss": 0.9906312227249146, |
| "eval_runtime": 0.8344, |
| "eval_samples_per_second": 62.318, |
| "eval_steps_per_second": 2.397, |
| "step": 48 |
| }, |
| { |
| "epoch": 12.842105263157894, |
| "eval_accuracy": 0.5961538461538461, |
| "eval_loss": 0.988998532295227, |
| "eval_runtime": 0.8289, |
| "eval_samples_per_second": 62.73, |
| "eval_steps_per_second": 2.413, |
| "step": 52 |
| }, |
| { |
| "epoch": 13.842105263157894, |
| "eval_accuracy": 0.6538461538461539, |
| "eval_loss": 0.9109674692153931, |
| "eval_runtime": 0.8337, |
| "eval_samples_per_second": 62.374, |
| "eval_steps_per_second": 2.399, |
| "step": 56 |
| }, |
| { |
| "epoch": 14.842105263157894, |
| "grad_norm": 13.505391120910645, |
| "learning_rate": 1.686241637868734e-05, |
| "loss": 0.7947, |
| "step": 60 |
| }, |
| { |
| "epoch": 14.842105263157894, |
| "eval_accuracy": 0.6730769230769231, |
| "eval_loss": 0.9282015562057495, |
| "eval_runtime": 1.167, |
| "eval_samples_per_second": 44.559, |
| "eval_steps_per_second": 1.714, |
| "step": 60 |
| }, |
| { |
| "epoch": 15.842105263157894, |
| "eval_accuracy": 0.6538461538461539, |
| "eval_loss": 0.931515634059906, |
| "eval_runtime": 0.8621, |
| "eval_samples_per_second": 60.315, |
| "eval_steps_per_second": 2.32, |
| "step": 64 |
| }, |
| { |
| "epoch": 16.842105263157894, |
| "eval_accuracy": 0.6153846153846154, |
| "eval_loss": 0.9229909181594849, |
| "eval_runtime": 0.8464, |
| "eval_samples_per_second": 61.434, |
| "eval_steps_per_second": 2.363, |
| "step": 68 |
| }, |
| { |
| "epoch": 17.842105263157894, |
| "grad_norm": 8.060040473937988, |
| "learning_rate": 1.5000000000000002e-05, |
| "loss": 0.7143, |
| "step": 72 |
| }, |
| { |
| "epoch": 17.842105263157894, |
| "eval_accuracy": 0.6538461538461539, |
| "eval_loss": 0.9067614674568176, |
| "eval_runtime": 0.8349, |
| "eval_samples_per_second": 62.281, |
| "eval_steps_per_second": 2.395, |
| "step": 72 |
| }, |
| { |
| "epoch": 18.842105263157894, |
| "eval_accuracy": 0.6153846153846154, |
| "eval_loss": 0.8996807932853699, |
| "eval_runtime": 0.8415, |
| "eval_samples_per_second": 61.795, |
| "eval_steps_per_second": 2.377, |
| "step": 76 |
| }, |
| { |
| "epoch": 19.842105263157894, |
| "eval_accuracy": 0.6923076923076923, |
| "eval_loss": 0.8648480772972107, |
| "eval_runtime": 1.1842, |
| "eval_samples_per_second": 43.912, |
| "eval_steps_per_second": 1.689, |
| "step": 80 |
| }, |
| { |
| "epoch": 20.842105263157894, |
| "grad_norm": 6.491458415985107, |
| "learning_rate": 1.2868032327110904e-05, |
| "loss": 0.6329, |
| "step": 84 |
| }, |
| { |
| "epoch": 20.842105263157894, |
| "eval_accuracy": 0.6538461538461539, |
| "eval_loss": 0.8624066710472107, |
| "eval_runtime": 1.178, |
| "eval_samples_per_second": 44.142, |
| "eval_steps_per_second": 1.698, |
| "step": 84 |
| }, |
| { |
| "epoch": 21.842105263157894, |
| "eval_accuracy": 0.6153846153846154, |
| "eval_loss": 0.8736539483070374, |
| "eval_runtime": 1.2262, |
| "eval_samples_per_second": 42.407, |
| "eval_steps_per_second": 1.631, |
| "step": 88 |
| }, |
| { |
| "epoch": 22.842105263157894, |
| "eval_accuracy": 0.6730769230769231, |
| "eval_loss": 0.8636062145233154, |
| "eval_runtime": 0.9335, |
| "eval_samples_per_second": 55.703, |
| "eval_steps_per_second": 2.142, |
| "step": 92 |
| }, |
| { |
| "epoch": 23.842105263157894, |
| "grad_norm": 13.519357681274414, |
| "learning_rate": 1.0581448289104759e-05, |
| "loss": 0.5508, |
| "step": 96 |
| }, |
| { |
| "epoch": 23.842105263157894, |
| "eval_accuracy": 0.6538461538461539, |
| "eval_loss": 0.8544560074806213, |
| "eval_runtime": 0.8147, |
| "eval_samples_per_second": 63.826, |
| "eval_steps_per_second": 2.455, |
| "step": 96 |
| }, |
| { |
| "epoch": 24.842105263157894, |
| "eval_accuracy": 0.6730769230769231, |
| "eval_loss": 0.8616629838943481, |
| "eval_runtime": 0.8014, |
| "eval_samples_per_second": 64.887, |
| "eval_steps_per_second": 2.496, |
| "step": 100 |
| }, |
| { |
| "epoch": 25.842105263157894, |
| "eval_accuracy": 0.6346153846153846, |
| "eval_loss": 0.8635188341140747, |
| "eval_runtime": 0.8235, |
| "eval_samples_per_second": 63.142, |
| "eval_steps_per_second": 2.429, |
| "step": 104 |
| }, |
| { |
| "epoch": 26.842105263157894, |
| "grad_norm": 8.143542289733887, |
| "learning_rate": 8.263518223330698e-06, |
| "loss": 0.5009, |
| "step": 108 |
| }, |
| { |
| "epoch": 26.842105263157894, |
| "eval_accuracy": 0.6346153846153846, |
| "eval_loss": 0.8650462627410889, |
| "eval_runtime": 0.8227, |
| "eval_samples_per_second": 63.207, |
| "eval_steps_per_second": 2.431, |
| "step": 108 |
| }, |
| { |
| "epoch": 27.842105263157894, |
| "eval_accuracy": 0.6538461538461539, |
| "eval_loss": 0.8637959361076355, |
| "eval_runtime": 1.2141, |
| "eval_samples_per_second": 42.831, |
| "eval_steps_per_second": 1.647, |
| "step": 112 |
| }, |
| { |
| "epoch": 28.842105263157894, |
| "eval_accuracy": 0.6538461538461539, |
| "eval_loss": 0.873045802116394, |
| "eval_runtime": 1.1581, |
| "eval_samples_per_second": 44.901, |
| "eval_steps_per_second": 1.727, |
| "step": 116 |
| }, |
| { |
| "epoch": 29.842105263157894, |
| "grad_norm": 10.985040664672852, |
| "learning_rate": 6.039202339608432e-06, |
| "loss": 0.5286, |
| "step": 120 |
| }, |
| { |
| "epoch": 29.842105263157894, |
| "eval_accuracy": 0.6346153846153846, |
| "eval_loss": 0.8886079788208008, |
| "eval_runtime": 1.168, |
| "eval_samples_per_second": 44.522, |
| "eval_steps_per_second": 1.712, |
| "step": 120 |
| }, |
| { |
| "epoch": 30.842105263157894, |
| "eval_accuracy": 0.6538461538461539, |
| "eval_loss": 0.882747232913971, |
| "eval_runtime": 1.0188, |
| "eval_samples_per_second": 51.04, |
| "eval_steps_per_second": 1.963, |
| "step": 124 |
| }, |
| { |
| "epoch": 31.842105263157894, |
| "eval_accuracy": 0.7307692307692307, |
| "eval_loss": 0.8747740983963013, |
| "eval_runtime": 0.8145, |
| "eval_samples_per_second": 63.847, |
| "eval_steps_per_second": 2.456, |
| "step": 128 |
| }, |
| { |
| "epoch": 32.8421052631579, |
| "grad_norm": 7.003128528594971, |
| "learning_rate": 4.028414082972141e-06, |
| "loss": 0.4559, |
| "step": 132 |
| }, |
| { |
| "epoch": 32.8421052631579, |
| "eval_accuracy": 0.7115384615384616, |
| "eval_loss": 0.8670610785484314, |
| "eval_runtime": 0.8405, |
| "eval_samples_per_second": 61.865, |
| "eval_steps_per_second": 2.379, |
| "step": 132 |
| }, |
| { |
| "epoch": 33.8421052631579, |
| "eval_accuracy": 0.6730769230769231, |
| "eval_loss": 0.8727457523345947, |
| "eval_runtime": 0.8367, |
| "eval_samples_per_second": 62.15, |
| "eval_steps_per_second": 2.39, |
| "step": 136 |
| }, |
| { |
| "epoch": 34.8421052631579, |
| "eval_accuracy": 0.7115384615384616, |
| "eval_loss": 0.8754667043685913, |
| "eval_runtime": 0.8489, |
| "eval_samples_per_second": 61.254, |
| "eval_steps_per_second": 2.356, |
| "step": 140 |
| }, |
| { |
| "epoch": 35.8421052631579, |
| "grad_norm": 7.350639343261719, |
| "learning_rate": 2.339555568810221e-06, |
| "loss": 0.4704, |
| "step": 144 |
| }, |
| { |
| "epoch": 35.8421052631579, |
| "eval_accuracy": 0.7307692307692307, |
| "eval_loss": 0.8759797215461731, |
| "eval_runtime": 0.845, |
| "eval_samples_per_second": 61.538, |
| "eval_steps_per_second": 2.367, |
| "step": 144 |
| }, |
| { |
| "epoch": 36.8421052631579, |
| "eval_accuracy": 0.7307692307692307, |
| "eval_loss": 0.8786163330078125, |
| "eval_runtime": 1.2012, |
| "eval_samples_per_second": 43.291, |
| "eval_steps_per_second": 1.665, |
| "step": 148 |
| }, |
| { |
| "epoch": 37.8421052631579, |
| "eval_accuracy": 0.7307692307692307, |
| "eval_loss": 0.878113329410553, |
| "eval_runtime": 0.8301, |
| "eval_samples_per_second": 62.641, |
| "eval_steps_per_second": 2.409, |
| "step": 152 |
| }, |
| { |
| "epoch": 38.8421052631579, |
| "grad_norm": 10.532869338989258, |
| "learning_rate": 1.0636735967658785e-06, |
| "loss": 0.4582, |
| "step": 156 |
| }, |
| { |
| "epoch": 38.8421052631579, |
| "eval_accuracy": 0.7307692307692307, |
| "eval_loss": 0.8771308660507202, |
| "eval_runtime": 0.807, |
| "eval_samples_per_second": 64.435, |
| "eval_steps_per_second": 2.478, |
| "step": 156 |
| }, |
| { |
| "epoch": 39.8421052631579, |
| "eval_accuracy": 0.7307692307692307, |
| "eval_loss": 0.8753777146339417, |
| "eval_runtime": 0.8106, |
| "eval_samples_per_second": 64.147, |
| "eval_steps_per_second": 2.467, |
| "step": 160 |
| }, |
| { |
| "epoch": 40.8421052631579, |
| "eval_accuracy": 0.7307692307692307, |
| "eval_loss": 0.8740986585617065, |
| "eval_runtime": 1.1627, |
| "eval_samples_per_second": 44.725, |
| "eval_steps_per_second": 1.72, |
| "step": 164 |
| }, |
| { |
| "epoch": 41.8421052631579, |
| "grad_norm": 6.582579135894775, |
| "learning_rate": 2.6955129420176193e-07, |
| "loss": 0.4538, |
| "step": 168 |
| }, |
| { |
| "epoch": 41.8421052631579, |
| "eval_accuracy": 0.7307692307692307, |
| "eval_loss": 0.8742378950119019, |
| "eval_runtime": 0.8152, |
| "eval_samples_per_second": 63.791, |
| "eval_steps_per_second": 2.453, |
| "step": 168 |
| }, |
| { |
| "epoch": 42.8421052631579, |
| "eval_accuracy": 0.7307692307692307, |
| "eval_loss": 0.873984694480896, |
| "eval_runtime": 0.8202, |
| "eval_samples_per_second": 63.397, |
| "eval_steps_per_second": 2.438, |
| "step": 172 |
| }, |
| { |
| "epoch": 43.8421052631579, |
| "eval_accuracy": 0.7307692307692307, |
| "eval_loss": 0.8740047216415405, |
| "eval_runtime": 0.8433, |
| "eval_samples_per_second": 61.665, |
| "eval_steps_per_second": 2.372, |
| "step": 176 |
| }, |
| { |
| "epoch": 44.8421052631579, |
| "grad_norm": 7.687587738037109, |
| "learning_rate": 1.8802955149865854e-09, |
| "loss": 0.4476, |
| "step": 180 |
| }, |
| { |
| "epoch": 44.8421052631579, |
| "eval_accuracy": 0.7307692307692307, |
| "eval_loss": 0.8741353750228882, |
| "eval_runtime": 1.1096, |
| "eval_samples_per_second": 46.864, |
| "eval_steps_per_second": 1.802, |
| "step": 180 |
| }, |
| { |
| "epoch": 44.8421052631579, |
| "step": 180, |
| "total_flos": 8.412779636714373e+17, |
| "train_loss": 0.7686147186491225, |
| "train_runtime": 536.055, |
| "train_samples_per_second": 50.872, |
| "train_steps_per_second": 0.336 |
| } |
| ], |
| "logging_steps": 12, |
| "max_steps": 180, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 45, |
| "save_steps": 500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 8.412779636714373e+17, |
| "train_batch_size": 32, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|