| { |
| "best_metric": 84.05797101449275, |
| "best_model_checkpoint": "outputs/bitfit/t5-base/rte/checkpoint-300", |
| "epoch": 20.0, |
| "global_step": 1560, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 1.28, |
| "eval_accuracy": 76.81159420289855, |
| "eval_average_metrics": 76.81159420289855, |
| "eval_loss": 0.21982769668102264, |
| "eval_runtime": 1.0149, |
| "eval_samples_per_second": 135.972, |
| "step": 100 |
| }, |
| { |
| "epoch": 2.56, |
| "eval_accuracy": 78.26086956521739, |
| "eval_average_metrics": 78.26086956521739, |
| "eval_loss": 0.18932242691516876, |
| "eval_runtime": 0.6715, |
| "eval_samples_per_second": 205.52, |
| "step": 200 |
| }, |
| { |
| "epoch": 3.85, |
| "eval_accuracy": 84.05797101449275, |
| "eval_average_metrics": 84.05797101449275, |
| "eval_loss": 0.16963252425193787, |
| "eval_runtime": 0.8653, |
| "eval_samples_per_second": 159.484, |
| "step": 300 |
| }, |
| { |
| "epoch": 5.13, |
| "eval_accuracy": 80.43478260869566, |
| "eval_average_metrics": 80.43478260869566, |
| "eval_loss": 0.18479692935943604, |
| "eval_runtime": 0.7171, |
| "eval_samples_per_second": 192.431, |
| "step": 400 |
| }, |
| { |
| "epoch": 6.41, |
| "learning_rate": 0.00020384615384615385, |
| "loss": 0.2327, |
| "step": 500 |
| }, |
| { |
| "epoch": 6.41, |
| "eval_accuracy": 81.88405797101449, |
| "eval_average_metrics": 81.88405797101449, |
| "eval_loss": 0.23633617162704468, |
| "eval_runtime": 0.6787, |
| "eval_samples_per_second": 203.343, |
| "step": 500 |
| }, |
| { |
| "epoch": 7.69, |
| "eval_accuracy": 79.71014492753623, |
| "eval_average_metrics": 79.71014492753623, |
| "eval_loss": 0.23751917481422424, |
| "eval_runtime": 0.8803, |
| "eval_samples_per_second": 156.767, |
| "step": 600 |
| }, |
| { |
| "epoch": 8.97, |
| "eval_accuracy": 84.05797101449275, |
| "eval_average_metrics": 84.05797101449275, |
| "eval_loss": 0.23690848052501678, |
| "eval_runtime": 0.5629, |
| "eval_samples_per_second": 245.142, |
| "step": 700 |
| }, |
| { |
| "epoch": 10.26, |
| "eval_accuracy": 83.33333333333334, |
| "eval_average_metrics": 83.33333333333334, |
| "eval_loss": 0.2846378684043884, |
| "eval_runtime": 0.9472, |
| "eval_samples_per_second": 145.689, |
| "step": 800 |
| }, |
| { |
| "epoch": 11.54, |
| "eval_accuracy": 82.6086956521739, |
| "eval_average_metrics": 82.6086956521739, |
| "eval_loss": 0.2770601212978363, |
| "eval_runtime": 0.8799, |
| "eval_samples_per_second": 156.839, |
| "step": 900 |
| }, |
| { |
| "epoch": 12.82, |
| "learning_rate": 0.00010769230769230768, |
| "loss": 0.0774, |
| "step": 1000 |
| }, |
| { |
| "epoch": 12.82, |
| "eval_accuracy": 82.6086956521739, |
| "eval_average_metrics": 82.6086956521739, |
| "eval_loss": 0.3579100966453552, |
| "eval_runtime": 0.9343, |
| "eval_samples_per_second": 147.71, |
| "step": 1000 |
| }, |
| { |
| "epoch": 14.1, |
| "eval_accuracy": 81.15942028985508, |
| "eval_average_metrics": 81.15942028985508, |
| "eval_loss": 0.4031548798084259, |
| "eval_runtime": 0.6763, |
| "eval_samples_per_second": 204.046, |
| "step": 1100 |
| }, |
| { |
| "epoch": 15.38, |
| "eval_accuracy": 81.15942028985508, |
| "eval_average_metrics": 81.15942028985508, |
| "eval_loss": 0.4019993841648102, |
| "eval_runtime": 0.9288, |
| "eval_samples_per_second": 148.583, |
| "step": 1200 |
| }, |
| { |
| "epoch": 16.67, |
| "eval_accuracy": 78.98550724637681, |
| "eval_average_metrics": 78.98550724637681, |
| "eval_loss": 0.47033587098121643, |
| "eval_runtime": 0.6015, |
| "eval_samples_per_second": 229.417, |
| "step": 1300 |
| }, |
| { |
| "epoch": 17.95, |
| "eval_accuracy": 81.88405797101449, |
| "eval_average_metrics": 81.88405797101449, |
| "eval_loss": 0.4693973958492279, |
| "eval_runtime": 0.8377, |
| "eval_samples_per_second": 164.743, |
| "step": 1400 |
| }, |
| { |
| "epoch": 19.23, |
| "learning_rate": 1.1538461538461538e-05, |
| "loss": 0.0312, |
| "step": 1500 |
| }, |
| { |
| "epoch": 19.23, |
| "eval_accuracy": 79.71014492753623, |
| "eval_average_metrics": 79.71014492753623, |
| "eval_loss": 0.5053138136863708, |
| "eval_runtime": 1.053, |
| "eval_samples_per_second": 131.051, |
| "step": 1500 |
| }, |
| { |
| "epoch": 20.0, |
| "step": 1560, |
| "total_flos": 7649465032433664.0, |
| "train_loss": 0.1103338890350782, |
| "train_runtime": 529.9082, |
| "train_samples_per_second": 93.979, |
| "train_steps_per_second": 2.944 |
| } |
| ], |
| "max_steps": 1560, |
| "num_train_epochs": 20, |
| "total_flos": 7649465032433664.0, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|