| { | |
| "best_metric": 0.8677685950413223, | |
| "best_model_checkpoint": "swin-base-patch4-window7-224-in22k-MM/NMM_Classification_base_V10/checkpoint-76", | |
| "epoch": 6.885245901639344, | |
| "eval_steps": 500, | |
| "global_step": 105, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.6557377049180327, | |
| "grad_norm": 4.473873615264893, | |
| "learning_rate": 4.545454545454546e-05, | |
| "loss": 0.8448, | |
| "step": 10 | |
| }, | |
| { | |
| "epoch": 0.9836065573770492, | |
| "step": 15, | |
| "train_accuracy": 0.8035137579124144, | |
| "train_auc_class_0": 0.9088436086296741, | |
| "train_auc_class_1": 0.8379446511466175, | |
| "train_auc_class_2": 0.8758602364377229, | |
| "train_auc_overall": 0.8742161654046715, | |
| "train_loss": 0.49683675169944763, | |
| "train_runtime": 777.5048, | |
| "train_samples_per_second": 9.956, | |
| "train_steps_per_second": 0.078 | |
| }, | |
| { | |
| "epoch": 0.9836065573770492, | |
| "eval_accuracy": 0.8362603305785123, | |
| "eval_auc_class_0": 0.9403517055860806, | |
| "eval_auc_class_1": 0.8605572313411073, | |
| "eval_auc_class_2": 0.8997462510986076, | |
| "eval_auc_overall": 0.9002183960085985, | |
| "eval_loss": 0.44267916679382324, | |
| "eval_runtime": 267.5178, | |
| "eval_samples_per_second": 7.237, | |
| "eval_steps_per_second": 0.06, | |
| "step": 15 | |
| }, | |
| { | |
| "epoch": 1.3114754098360657, | |
| "grad_norm": 2.1386613845825195, | |
| "learning_rate": 4.5212765957446815e-05, | |
| "loss": 0.512, | |
| "step": 20 | |
| }, | |
| { | |
| "epoch": 1.9672131147540983, | |
| "grad_norm": 1.435038685798645, | |
| "learning_rate": 3.9893617021276594e-05, | |
| "loss": 0.4434, | |
| "step": 30 | |
| }, | |
| { | |
| "epoch": 1.9672131147540983, | |
| "step": 30, | |
| "train_accuracy": 0.840201524350859, | |
| "train_auc_class_0": 0.9414490637347536, | |
| "train_auc_class_1": 0.8997057391727663, | |
| "train_auc_class_2": 0.9139346212557102, | |
| "train_auc_overall": 0.9183631413877434, | |
| "train_loss": 0.4013007879257202, | |
| "train_runtime": 714.2886, | |
| "train_samples_per_second": 10.837, | |
| "train_steps_per_second": 0.085 | |
| }, | |
| { | |
| "epoch": 1.9672131147540983, | |
| "eval_accuracy": 0.8445247933884298, | |
| "eval_auc_class_0": 0.9560139079670331, | |
| "eval_auc_class_1": 0.9042625890669138, | |
| "eval_auc_class_2": 0.9195875061825728, | |
| "eval_auc_overall": 0.9266213344055066, | |
| "eval_loss": 0.3872886896133423, | |
| "eval_runtime": 214.551, | |
| "eval_samples_per_second": 9.023, | |
| "eval_steps_per_second": 0.075, | |
| "step": 30 | |
| }, | |
| { | |
| "epoch": 2.6229508196721314, | |
| "grad_norm": 2.210986852645874, | |
| "learning_rate": 3.4574468085106386e-05, | |
| "loss": 0.3979, | |
| "step": 40 | |
| }, | |
| { | |
| "epoch": 2.9508196721311473, | |
| "step": 45, | |
| "train_accuracy": 0.8537656633509882, | |
| "train_auc_class_0": 0.9565036613124893, | |
| "train_auc_class_1": 0.9187875975798461, | |
| "train_auc_class_2": 0.9285740636485835, | |
| "train_auc_overall": 0.9346217741803063, | |
| "train_loss": 0.3611737787723541, | |
| "train_runtime": 704.8242, | |
| "train_samples_per_second": 10.983, | |
| "train_steps_per_second": 0.087 | |
| }, | |
| { | |
| "epoch": 2.9508196721311473, | |
| "eval_accuracy": 0.8584710743801653, | |
| "eval_auc_class_0": 0.9593907394688643, | |
| "eval_auc_class_1": 0.9080973087319308, | |
| "eval_auc_class_2": 0.9256975615561118, | |
| "eval_auc_overall": 0.931061869918969, | |
| "eval_loss": 0.36146315932273865, | |
| "eval_runtime": 207.9281, | |
| "eval_samples_per_second": 9.311, | |
| "eval_steps_per_second": 0.077, | |
| "step": 45 | |
| }, | |
| { | |
| "epoch": 3.278688524590164, | |
| "grad_norm": 2.5246520042419434, | |
| "learning_rate": 2.925531914893617e-05, | |
| "loss": 0.3733, | |
| "step": 50 | |
| }, | |
| { | |
| "epoch": 3.9344262295081966, | |
| "grad_norm": 2.381304979324341, | |
| "learning_rate": 2.393617021276596e-05, | |
| "loss": 0.3593, | |
| "step": 60 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "step": 61, | |
| "train_accuracy": 0.865779615036817, | |
| "train_auc_class_0": 0.9630790814865717, | |
| "train_auc_class_1": 0.9318475950588521, | |
| "train_auc_class_2": 0.9373109719652593, | |
| "train_auc_overall": 0.9440792161702277, | |
| "train_loss": 0.33730149269104004, | |
| "train_runtime": 698.4574, | |
| "train_samples_per_second": 11.083, | |
| "train_steps_per_second": 0.087 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_accuracy": 0.862603305785124, | |
| "eval_auc_class_0": 0.9629407051282051, | |
| "eval_auc_class_1": 0.9201237904963373, | |
| "eval_auc_class_2": 0.9316191956643276, | |
| "eval_auc_overall": 0.9382278970962901, | |
| "eval_loss": 0.34607622027397156, | |
| "eval_runtime": 206.0574, | |
| "eval_samples_per_second": 9.395, | |
| "eval_steps_per_second": 0.078, | |
| "step": 61 | |
| }, | |
| { | |
| "epoch": 4.590163934426229, | |
| "grad_norm": 2.1240530014038086, | |
| "learning_rate": 1.8617021276595745e-05, | |
| "loss": 0.3473, | |
| "step": 70 | |
| }, | |
| { | |
| "epoch": 4.983606557377049, | |
| "step": 76, | |
| "train_accuracy": 0.8688799896654179, | |
| "train_auc_class_0": 0.9654619767508447, | |
| "train_auc_class_1": 0.9391473390475861, | |
| "train_auc_class_2": 0.9405490167752112, | |
| "train_auc_overall": 0.9483861108578807, | |
| "train_loss": 0.32362109422683716, | |
| "train_runtime": 706.7637, | |
| "train_samples_per_second": 10.953, | |
| "train_steps_per_second": 0.086 | |
| }, | |
| { | |
| "epoch": 4.983606557377049, | |
| "eval_accuracy": 0.8677685950413223, | |
| "eval_auc_class_0": 0.9631310096153847, | |
| "eval_auc_class_1": 0.9189268008165645, | |
| "eval_auc_class_2": 0.9322997435239486, | |
| "eval_auc_overall": 0.938119184651966, | |
| "eval_loss": 0.34411147236824036, | |
| "eval_runtime": 207.2323, | |
| "eval_samples_per_second": 9.342, | |
| "eval_steps_per_second": 0.077, | |
| "step": 76 | |
| }, | |
| { | |
| "epoch": 5.245901639344262, | |
| "grad_norm": 2.395565986633301, | |
| "learning_rate": 1.3297872340425532e-05, | |
| "loss": 0.3381, | |
| "step": 80 | |
| }, | |
| { | |
| "epoch": 5.901639344262295, | |
| "grad_norm": 1.6295080184936523, | |
| "learning_rate": 7.97872340425532e-06, | |
| "loss": 0.3318, | |
| "step": 90 | |
| }, | |
| { | |
| "epoch": 5.967213114754099, | |
| "step": 91, | |
| "train_accuracy": 0.8766309262369203, | |
| "train_auc_class_0": 0.9675600734409895, | |
| "train_auc_class_1": 0.9360009866648122, | |
| "train_auc_class_2": 0.9450547274524197, | |
| "train_auc_overall": 0.9495385958527405, | |
| "train_loss": 0.31677091121673584, | |
| "train_runtime": 712.6133, | |
| "train_samples_per_second": 10.863, | |
| "train_steps_per_second": 0.086 | |
| }, | |
| { | |
| "epoch": 5.967213114754099, | |
| "eval_accuracy": 0.8667355371900827, | |
| "eval_auc_class_0": 0.9631009615384616, | |
| "eval_auc_class_1": 0.916550232215998, | |
| "eval_auc_class_2": 0.9317034893882878, | |
| "eval_auc_overall": 0.9371182277142491, | |
| "eval_loss": 0.34614038467407227, | |
| "eval_runtime": 209.8829, | |
| "eval_samples_per_second": 9.224, | |
| "eval_steps_per_second": 0.076, | |
| "step": 91 | |
| }, | |
| { | |
| "epoch": 6.557377049180328, | |
| "grad_norm": 3.0411829948425293, | |
| "learning_rate": 2.6595744680851065e-06, | |
| "loss": 0.3147, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 6.885245901639344, | |
| "step": 105, | |
| "train_accuracy": 0.8770184730654954, | |
| "train_auc_class_0": 0.9688894018782569, | |
| "train_auc_class_1": 0.9353519937583671, | |
| "train_auc_class_2": 0.9460088191382243, | |
| "train_auc_overall": 0.9500834049249495, | |
| "train_loss": 0.3142475485801697, | |
| "train_runtime": 690.6226, | |
| "train_samples_per_second": 11.209, | |
| "train_steps_per_second": 0.088 | |
| }, | |
| { | |
| "epoch": 6.885245901639344, | |
| "eval_accuracy": 0.862603305785124, | |
| "eval_auc_class_0": 0.9628863324175823, | |
| "eval_auc_class_1": 0.9189616223345215, | |
| "eval_auc_class_2": 0.93194521403788, | |
| "eval_auc_overall": 0.937931056263328, | |
| "eval_loss": 0.3451487123966217, | |
| "eval_runtime": 207.6543, | |
| "eval_samples_per_second": 9.323, | |
| "eval_steps_per_second": 0.077, | |
| "step": 105 | |
| }, | |
| { | |
| "epoch": 6.885245901639344, | |
| "step": 105, | |
| "total_flos": 4.180411553219629e+18, | |
| "train_loss": 0.4214494603020804, | |
| "train_runtime": 12181.9025, | |
| "train_samples_per_second": 4.448, | |
| "train_steps_per_second": 0.009 | |
| } | |
| ], | |
| "logging_steps": 10, | |
| "max_steps": 105, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 7, | |
| "save_steps": 500, | |
| "stateful_callbacks": { | |
| "TrainerControl": { | |
| "args": { | |
| "should_epoch_stop": false, | |
| "should_evaluate": false, | |
| "should_log": false, | |
| "should_save": true, | |
| "should_training_stop": true | |
| }, | |
| "attributes": {} | |
| } | |
| }, | |
| "total_flos": 4.180411553219629e+18, | |
| "train_batch_size": 128, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |