| { |
| "best_metric": 0.75, |
| "best_model_checkpoint": "swinv2-tiny-patch4-window8-256-dmae-humeda-DAV54/checkpoint-60", |
| "epoch": 33.38095238095238, |
| "eval_steps": 500, |
| "global_step": 100, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 1.0, |
| "eval_accuracy": 0.19318181818181818, |
| "eval_loss": 1.585249423980713, |
| "eval_runtime": 1.4912, |
| "eval_samples_per_second": 59.014, |
| "eval_steps_per_second": 2.012, |
| "step": 3 |
| }, |
| { |
| "epoch": 2.0, |
| "eval_accuracy": 0.3181818181818182, |
| "eval_loss": 1.578413486480713, |
| "eval_runtime": 1.5431, |
| "eval_samples_per_second": 57.028, |
| "eval_steps_per_second": 1.944, |
| "step": 6 |
| }, |
| { |
| "epoch": 3.0, |
| "eval_accuracy": 0.4318181818181818, |
| "eval_loss": 1.537353515625, |
| "eval_runtime": 1.5969, |
| "eval_samples_per_second": 55.107, |
| "eval_steps_per_second": 1.879, |
| "step": 9 |
| }, |
| { |
| "epoch": 3.380952380952381, |
| "grad_norm": 3.083775520324707, |
| "learning_rate": 5e-05, |
| "loss": 1.3768, |
| "step": 10 |
| }, |
| { |
| "epoch": 4.0, |
| "eval_accuracy": 0.4090909090909091, |
| "eval_loss": 1.4629433155059814, |
| "eval_runtime": 1.5346, |
| "eval_samples_per_second": 57.345, |
| "eval_steps_per_second": 1.955, |
| "step": 12 |
| }, |
| { |
| "epoch": 5.0, |
| "eval_accuracy": 0.5340909090909091, |
| "eval_loss": 1.2221930027008057, |
| "eval_runtime": 2.5597, |
| "eval_samples_per_second": 34.379, |
| "eval_steps_per_second": 1.172, |
| "step": 15 |
| }, |
| { |
| "epoch": 6.0, |
| "eval_accuracy": 0.5454545454545454, |
| "eval_loss": 1.2436859607696533, |
| "eval_runtime": 1.5399, |
| "eval_samples_per_second": 57.146, |
| "eval_steps_per_second": 1.948, |
| "step": 18 |
| }, |
| { |
| "epoch": 6.761904761904762, |
| "grad_norm": 4.605942249298096, |
| "learning_rate": 4.849231551964771e-05, |
| "loss": 0.942, |
| "step": 20 |
| }, |
| { |
| "epoch": 7.0, |
| "eval_accuracy": 0.5340909090909091, |
| "eval_loss": 1.242801308631897, |
| "eval_runtime": 1.5797, |
| "eval_samples_per_second": 55.707, |
| "eval_steps_per_second": 1.899, |
| "step": 21 |
| }, |
| { |
| "epoch": 8.0, |
| "eval_accuracy": 0.5340909090909091, |
| "eval_loss": 1.1750913858413696, |
| "eval_runtime": 2.5156, |
| "eval_samples_per_second": 34.982, |
| "eval_steps_per_second": 1.193, |
| "step": 24 |
| }, |
| { |
| "epoch": 9.0, |
| "eval_accuracy": 0.5795454545454546, |
| "eval_loss": 1.1278696060180664, |
| "eval_runtime": 2.3024, |
| "eval_samples_per_second": 38.222, |
| "eval_steps_per_second": 1.303, |
| "step": 27 |
| }, |
| { |
| "epoch": 10.0, |
| "grad_norm": 6.71976900100708, |
| "learning_rate": 4.415111107797445e-05, |
| "loss": 0.6265, |
| "step": 30 |
| }, |
| { |
| "epoch": 10.0, |
| "eval_accuracy": 0.6477272727272727, |
| "eval_loss": 0.9868423342704773, |
| "eval_runtime": 2.2207, |
| "eval_samples_per_second": 39.627, |
| "eval_steps_per_second": 1.351, |
| "step": 30 |
| }, |
| { |
| "epoch": 11.0, |
| "eval_accuracy": 0.6363636363636364, |
| "eval_loss": 0.9661000967025757, |
| "eval_runtime": 2.178, |
| "eval_samples_per_second": 40.404, |
| "eval_steps_per_second": 1.377, |
| "step": 33 |
| }, |
| { |
| "epoch": 12.0, |
| "eval_accuracy": 0.6136363636363636, |
| "eval_loss": 0.9892013669013977, |
| "eval_runtime": 2.2016, |
| "eval_samples_per_second": 39.97, |
| "eval_steps_per_second": 1.363, |
| "step": 36 |
| }, |
| { |
| "epoch": 13.0, |
| "eval_accuracy": 0.6818181818181818, |
| "eval_loss": 0.87156081199646, |
| "eval_runtime": 1.6274, |
| "eval_samples_per_second": 54.073, |
| "eval_steps_per_second": 1.843, |
| "step": 39 |
| }, |
| { |
| "epoch": 13.380952380952381, |
| "grad_norm": 6.5638837814331055, |
| "learning_rate": 3.7500000000000003e-05, |
| "loss": 0.5106, |
| "step": 40 |
| }, |
| { |
| "epoch": 14.0, |
| "eval_accuracy": 0.7272727272727273, |
| "eval_loss": 0.8009552359580994, |
| "eval_runtime": 1.5443, |
| "eval_samples_per_second": 56.984, |
| "eval_steps_per_second": 1.943, |
| "step": 42 |
| }, |
| { |
| "epoch": 15.0, |
| "eval_accuracy": 0.6818181818181818, |
| "eval_loss": 0.8596124053001404, |
| "eval_runtime": 1.5414, |
| "eval_samples_per_second": 57.091, |
| "eval_steps_per_second": 1.946, |
| "step": 45 |
| }, |
| { |
| "epoch": 16.0, |
| "eval_accuracy": 0.6931818181818182, |
| "eval_loss": 0.8257151246070862, |
| "eval_runtime": 2.2212, |
| "eval_samples_per_second": 39.619, |
| "eval_steps_per_second": 1.351, |
| "step": 48 |
| }, |
| { |
| "epoch": 16.761904761904763, |
| "grad_norm": 5.321930885314941, |
| "learning_rate": 2.9341204441673266e-05, |
| "loss": 0.4183, |
| "step": 50 |
| }, |
| { |
| "epoch": 17.0, |
| "eval_accuracy": 0.7045454545454546, |
| "eval_loss": 0.8189888000488281, |
| "eval_runtime": 1.5383, |
| "eval_samples_per_second": 57.207, |
| "eval_steps_per_second": 1.95, |
| "step": 51 |
| }, |
| { |
| "epoch": 18.0, |
| "eval_accuracy": 0.7272727272727273, |
| "eval_loss": 0.7627521753311157, |
| "eval_runtime": 2.2402, |
| "eval_samples_per_second": 39.283, |
| "eval_steps_per_second": 1.339, |
| "step": 54 |
| }, |
| { |
| "epoch": 19.0, |
| "eval_accuracy": 0.7159090909090909, |
| "eval_loss": 0.7801702618598938, |
| "eval_runtime": 2.2768, |
| "eval_samples_per_second": 38.651, |
| "eval_steps_per_second": 1.318, |
| "step": 57 |
| }, |
| { |
| "epoch": 20.0, |
| "grad_norm": 3.8304524421691895, |
| "learning_rate": 2.0658795558326743e-05, |
| "loss": 0.3267, |
| "step": 60 |
| }, |
| { |
| "epoch": 20.0, |
| "eval_accuracy": 0.75, |
| "eval_loss": 0.7753319144248962, |
| "eval_runtime": 2.3302, |
| "eval_samples_per_second": 37.766, |
| "eval_steps_per_second": 1.287, |
| "step": 60 |
| }, |
| { |
| "epoch": 21.0, |
| "eval_accuracy": 0.7386363636363636, |
| "eval_loss": 0.7770728468894958, |
| "eval_runtime": 2.2672, |
| "eval_samples_per_second": 38.815, |
| "eval_steps_per_second": 1.323, |
| "step": 63 |
| }, |
| { |
| "epoch": 22.0, |
| "eval_accuracy": 0.75, |
| "eval_loss": 0.7770181894302368, |
| "eval_runtime": 2.3268, |
| "eval_samples_per_second": 37.821, |
| "eval_steps_per_second": 1.289, |
| "step": 66 |
| }, |
| { |
| "epoch": 23.0, |
| "eval_accuracy": 0.7272727272727273, |
| "eval_loss": 0.7940635681152344, |
| "eval_runtime": 2.2104, |
| "eval_samples_per_second": 39.812, |
| "eval_steps_per_second": 1.357, |
| "step": 69 |
| }, |
| { |
| "epoch": 23.38095238095238, |
| "grad_norm": 5.505289077758789, |
| "learning_rate": 1.2500000000000006e-05, |
| "loss": 0.3008, |
| "step": 70 |
| }, |
| { |
| "epoch": 24.0, |
| "eval_accuracy": 0.7272727272727273, |
| "eval_loss": 0.7921419739723206, |
| "eval_runtime": 2.1726, |
| "eval_samples_per_second": 40.505, |
| "eval_steps_per_second": 1.381, |
| "step": 72 |
| }, |
| { |
| "epoch": 25.0, |
| "eval_accuracy": 0.7386363636363636, |
| "eval_loss": 0.7899277210235596, |
| "eval_runtime": 2.2223, |
| "eval_samples_per_second": 39.599, |
| "eval_steps_per_second": 1.35, |
| "step": 75 |
| }, |
| { |
| "epoch": 26.0, |
| "eval_accuracy": 0.75, |
| "eval_loss": 0.7849180698394775, |
| "eval_runtime": 2.1648, |
| "eval_samples_per_second": 40.65, |
| "eval_steps_per_second": 1.386, |
| "step": 78 |
| }, |
| { |
| "epoch": 26.761904761904763, |
| "grad_norm": 5.414725303649902, |
| "learning_rate": 5.848888922025553e-06, |
| "loss": 0.2795, |
| "step": 80 |
| }, |
| { |
| "epoch": 27.0, |
| "eval_accuracy": 0.75, |
| "eval_loss": 0.7891153693199158, |
| "eval_runtime": 2.2542, |
| "eval_samples_per_second": 39.038, |
| "eval_steps_per_second": 1.331, |
| "step": 81 |
| }, |
| { |
| "epoch": 28.0, |
| "eval_accuracy": 0.7386363636363636, |
| "eval_loss": 0.7973006963729858, |
| "eval_runtime": 2.205, |
| "eval_samples_per_second": 39.909, |
| "eval_steps_per_second": 1.361, |
| "step": 84 |
| }, |
| { |
| "epoch": 29.0, |
| "eval_accuracy": 0.7386363636363636, |
| "eval_loss": 0.8067693710327148, |
| "eval_runtime": 2.1816, |
| "eval_samples_per_second": 40.338, |
| "eval_steps_per_second": 1.375, |
| "step": 87 |
| }, |
| { |
| "epoch": 30.0, |
| "grad_norm": 4.411905765533447, |
| "learning_rate": 1.5076844803522922e-06, |
| "loss": 0.2526, |
| "step": 90 |
| }, |
| { |
| "epoch": 30.0, |
| "eval_accuracy": 0.7386363636363636, |
| "eval_loss": 0.8087642788887024, |
| "eval_runtime": 1.5036, |
| "eval_samples_per_second": 58.526, |
| "eval_steps_per_second": 1.995, |
| "step": 90 |
| }, |
| { |
| "epoch": 31.0, |
| "eval_accuracy": 0.7386363636363636, |
| "eval_loss": 0.8097642660140991, |
| "eval_runtime": 1.8153, |
| "eval_samples_per_second": 48.476, |
| "eval_steps_per_second": 1.653, |
| "step": 93 |
| }, |
| { |
| "epoch": 32.0, |
| "eval_accuracy": 0.7386363636363636, |
| "eval_loss": 0.8095622658729553, |
| "eval_runtime": 1.82, |
| "eval_samples_per_second": 48.352, |
| "eval_steps_per_second": 1.648, |
| "step": 96 |
| }, |
| { |
| "epoch": 33.0, |
| "eval_accuracy": 0.7386363636363636, |
| "eval_loss": 0.8095269799232483, |
| "eval_runtime": 1.7559, |
| "eval_samples_per_second": 50.118, |
| "eval_steps_per_second": 1.709, |
| "step": 99 |
| }, |
| { |
| "epoch": 33.38095238095238, |
| "grad_norm": 5.03811502456665, |
| "learning_rate": 0.0, |
| "loss": 0.2544, |
| "step": 100 |
| }, |
| { |
| "epoch": 33.38095238095238, |
| "eval_accuracy": 0.7386363636363636, |
| "eval_loss": 0.8093982338905334, |
| "eval_runtime": 1.7511, |
| "eval_samples_per_second": 50.253, |
| "eval_steps_per_second": 1.713, |
| "step": 100 |
| }, |
| { |
| "epoch": 33.38095238095238, |
| "step": 100, |
| "total_flos": 7.202076007838515e+17, |
| "train_loss": 0.5288270854949951, |
| "train_runtime": 627.2045, |
| "train_samples_per_second": 52.854, |
| "train_steps_per_second": 0.159 |
| } |
| ], |
| "logging_steps": 10, |
| "max_steps": 100, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 50, |
| "save_steps": 500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 7.202076007838515e+17, |
| "train_batch_size": 32, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|