| { |
| "best_metric": 0.018954848870635033, |
| "best_model_checkpoint": "swinv2-tiny-patch4-window8-256-Kontur-competition-1.3K/checkpoint-52", |
| "epoch": 12.631578947368421, |
| "eval_steps": 500, |
| "global_step": 60, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.84, |
| "eval_loss": 0.6833776235580444, |
| "eval_runtime": 3.0114, |
| "eval_samples_per_second": 44.165, |
| "eval_steps_per_second": 0.996, |
| "step": 4 |
| }, |
| { |
| "epoch": 1.89, |
| "eval_loss": 0.4898586869239807, |
| "eval_runtime": 3.4038, |
| "eval_samples_per_second": 39.074, |
| "eval_steps_per_second": 0.881, |
| "step": 9 |
| }, |
| { |
| "epoch": 2.11, |
| "grad_norm": 2.64339280128479, |
| "learning_rate": 4.62962962962963e-05, |
| "loss": 0.6773, |
| "step": 10 |
| }, |
| { |
| "epoch": 2.95, |
| "eval_loss": 0.2752000093460083, |
| "eval_runtime": 2.6262, |
| "eval_samples_per_second": 50.644, |
| "eval_steps_per_second": 1.142, |
| "step": 14 |
| }, |
| { |
| "epoch": 4.0, |
| "eval_loss": 0.13112162053585052, |
| "eval_runtime": 2.6149, |
| "eval_samples_per_second": 50.862, |
| "eval_steps_per_second": 1.147, |
| "step": 19 |
| }, |
| { |
| "epoch": 4.21, |
| "grad_norm": 2.5273399353027344, |
| "learning_rate": 3.7037037037037037e-05, |
| "loss": 0.3528, |
| "step": 20 |
| }, |
| { |
| "epoch": 4.84, |
| "eval_loss": 0.08120357245206833, |
| "eval_runtime": 3.1533, |
| "eval_samples_per_second": 42.178, |
| "eval_steps_per_second": 0.951, |
| "step": 23 |
| }, |
| { |
| "epoch": 5.89, |
| "eval_loss": 0.04769232124090195, |
| "eval_runtime": 2.61, |
| "eval_samples_per_second": 50.958, |
| "eval_steps_per_second": 1.149, |
| "step": 28 |
| }, |
| { |
| "epoch": 6.32, |
| "grad_norm": 13.101208686828613, |
| "learning_rate": 2.777777777777778e-05, |
| "loss": 0.1595, |
| "step": 30 |
| }, |
| { |
| "epoch": 6.95, |
| "eval_loss": 0.028914544731378555, |
| "eval_runtime": 3.2525, |
| "eval_samples_per_second": 40.891, |
| "eval_steps_per_second": 0.922, |
| "step": 33 |
| }, |
| { |
| "epoch": 8.0, |
| "eval_loss": 0.022866781800985336, |
| "eval_runtime": 2.636, |
| "eval_samples_per_second": 50.456, |
| "eval_steps_per_second": 1.138, |
| "step": 38 |
| }, |
| { |
| "epoch": 8.42, |
| "grad_norm": 7.744855880737305, |
| "learning_rate": 1.8518518518518518e-05, |
| "loss": 0.1054, |
| "step": 40 |
| }, |
| { |
| "epoch": 8.84, |
| "eval_loss": 0.02127755992114544, |
| "eval_runtime": 2.7818, |
| "eval_samples_per_second": 47.812, |
| "eval_steps_per_second": 1.078, |
| "step": 42 |
| }, |
| { |
| "epoch": 9.89, |
| "eval_loss": 0.028130069375038147, |
| "eval_runtime": 3.1605, |
| "eval_samples_per_second": 42.083, |
| "eval_steps_per_second": 0.949, |
| "step": 47 |
| }, |
| { |
| "epoch": 10.53, |
| "grad_norm": 4.180393695831299, |
| "learning_rate": 9.259259259259259e-06, |
| "loss": 0.0822, |
| "step": 50 |
| }, |
| { |
| "epoch": 10.95, |
| "eval_loss": 0.018954848870635033, |
| "eval_runtime": 3.079, |
| "eval_samples_per_second": 43.196, |
| "eval_steps_per_second": 0.974, |
| "step": 52 |
| }, |
| { |
| "epoch": 12.0, |
| "eval_loss": 0.023994147777557373, |
| "eval_runtime": 2.9444, |
| "eval_samples_per_second": 45.17, |
| "eval_steps_per_second": 1.019, |
| "step": 57 |
| }, |
| { |
| "epoch": 12.63, |
| "grad_norm": 2.7027509212493896, |
| "learning_rate": 0.0, |
| "loss": 0.076, |
| "step": 60 |
| }, |
| { |
| "epoch": 12.63, |
| "eval_loss": 0.023665426298975945, |
| "eval_runtime": 3.0873, |
| "eval_samples_per_second": 43.079, |
| "eval_steps_per_second": 0.972, |
| "step": 60 |
| }, |
| { |
| "epoch": 12.63, |
| "step": 60, |
| "total_flos": 4.9113822316304794e+17, |
| "train_loss": 0.24218196471532186, |
| "train_runtime": 426.607, |
| "train_samples_per_second": 41.982, |
| "train_steps_per_second": 0.141 |
| } |
| ], |
| "logging_steps": 10, |
| "max_steps": 60, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 15, |
| "save_steps": 500, |
| "total_flos": 4.9113822316304794e+17, |
| "train_batch_size": 64, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|