| { |
| "best_metric": 0.18770882487297058, |
| "best_model_checkpoint": "./models/results_one_liners_453/checkpoint-225", |
| "epoch": 0.6489994591671173, |
| "global_step": 225, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.02, |
| "learning_rate": 4.000000000000001e-06, |
| "loss": 0.6902, |
| "step": 8 |
| }, |
| { |
| "epoch": 0.05, |
| "learning_rate": 8.000000000000001e-06, |
| "loss": 0.6955, |
| "step": 16 |
| }, |
| { |
| "epoch": 0.07, |
| "learning_rate": 1.2e-05, |
| "loss": 0.6911, |
| "step": 24 |
| }, |
| { |
| "epoch": 0.07, |
| "eval_accuracy": 0.49842271293375395, |
| "eval_f1": 0.6618460229689495, |
| "eval_loss": 0.6824508309364319, |
| "eval_precision": 0.494596312778131, |
| "eval_recall": 1.0, |
| "eval_runtime": 18.4237, |
| "eval_samples_per_second": 172.061, |
| "eval_steps_per_second": 21.548, |
| "step": 25 |
| }, |
| { |
| "epoch": 0.09, |
| "learning_rate": 1.6000000000000003e-05, |
| "loss": 0.674, |
| "step": 32 |
| }, |
| { |
| "epoch": 0.12, |
| "learning_rate": 2e-05, |
| "loss": 0.611, |
| "step": 40 |
| }, |
| { |
| "epoch": 0.14, |
| "learning_rate": 2.4e-05, |
| "loss": 0.4327, |
| "step": 48 |
| }, |
| { |
| "epoch": 0.14, |
| "eval_accuracy": 0.8712933753943217, |
| "eval_f1": 0.8696485623003196, |
| "eval_loss": 0.31961607933044434, |
| "eval_precision": 0.8646759847522236, |
| "eval_recall": 0.8746786632390745, |
| "eval_runtime": 18.2327, |
| "eval_samples_per_second": 173.864, |
| "eval_steps_per_second": 21.774, |
| "step": 50 |
| }, |
| { |
| "epoch": 0.16, |
| "learning_rate": 2.8000000000000003e-05, |
| "loss": 0.3598, |
| "step": 56 |
| }, |
| { |
| "epoch": 0.18, |
| "learning_rate": 3.2000000000000005e-05, |
| "loss": 0.392, |
| "step": 64 |
| }, |
| { |
| "epoch": 0.21, |
| "learning_rate": 3.6e-05, |
| "loss": 0.3812, |
| "step": 72 |
| }, |
| { |
| "epoch": 0.22, |
| "eval_accuracy": 0.8914826498422713, |
| "eval_f1": 0.8940234134319162, |
| "eval_loss": 0.2683391869068146, |
| "eval_precision": 0.8585798816568048, |
| "eval_recall": 0.9325192802056556, |
| "eval_runtime": 18.1749, |
| "eval_samples_per_second": 174.416, |
| "eval_steps_per_second": 21.843, |
| "step": 75 |
| }, |
| { |
| "epoch": 0.23, |
| "learning_rate": 4e-05, |
| "loss": 0.3055, |
| "step": 80 |
| }, |
| { |
| "epoch": 0.25, |
| "learning_rate": 4.4000000000000006e-05, |
| "loss": 0.3159, |
| "step": 88 |
| }, |
| { |
| "epoch": 0.28, |
| "learning_rate": 4.8e-05, |
| "loss": 0.3093, |
| "step": 96 |
| }, |
| { |
| "epoch": 0.29, |
| "eval_accuracy": 0.9025236593059937, |
| "eval_f1": 0.896551724137931, |
| "eval_loss": 0.26234087347984314, |
| "eval_precision": 0.9357092941998603, |
| "eval_recall": 0.8605398457583547, |
| "eval_runtime": 18.2515, |
| "eval_samples_per_second": 173.684, |
| "eval_steps_per_second": 21.752, |
| "step": 100 |
| }, |
| { |
| "epoch": 0.3, |
| "learning_rate": 4.9186991869918704e-05, |
| "loss": 0.3469, |
| "step": 104 |
| }, |
| { |
| "epoch": 0.32, |
| "learning_rate": 4.75609756097561e-05, |
| "loss": 0.3545, |
| "step": 112 |
| }, |
| { |
| "epoch": 0.35, |
| "learning_rate": 4.613821138211382e-05, |
| "loss": 0.3241, |
| "step": 120 |
| }, |
| { |
| "epoch": 0.36, |
| "eval_accuracy": 0.8858044164037855, |
| "eval_f1": 0.8927725118483413, |
| "eval_loss": 0.30523255467414856, |
| "eval_precision": 0.828021978021978, |
| "eval_recall": 0.968508997429306, |
| "eval_runtime": 18.1682, |
| "eval_samples_per_second": 174.481, |
| "eval_steps_per_second": 21.851, |
| "step": 125 |
| }, |
| { |
| "epoch": 0.37, |
| "learning_rate": 4.451219512195122e-05, |
| "loss": 0.2721, |
| "step": 128 |
| }, |
| { |
| "epoch": 0.39, |
| "learning_rate": 4.2886178861788616e-05, |
| "loss": 0.3343, |
| "step": 136 |
| }, |
| { |
| "epoch": 0.42, |
| "learning_rate": 4.126016260162602e-05, |
| "loss": 0.3455, |
| "step": 144 |
| }, |
| { |
| "epoch": 0.43, |
| "eval_accuracy": 0.9141955835962146, |
| "eval_f1": 0.9128205128205129, |
| "eval_loss": 0.22679537534713745, |
| "eval_precision": 0.9104859335038363, |
| "eval_recall": 0.9151670951156813, |
| "eval_runtime": 18.2508, |
| "eval_samples_per_second": 173.691, |
| "eval_steps_per_second": 21.752, |
| "step": 150 |
| }, |
| { |
| "epoch": 0.44, |
| "learning_rate": 3.9634146341463416e-05, |
| "loss": 0.2462, |
| "step": 152 |
| }, |
| { |
| "epoch": 0.46, |
| "learning_rate": 3.800813008130081e-05, |
| "loss": 0.2843, |
| "step": 160 |
| }, |
| { |
| "epoch": 0.48, |
| "learning_rate": 3.6382113821138216e-05, |
| "loss": 0.1991, |
| "step": 168 |
| }, |
| { |
| "epoch": 0.5, |
| "eval_accuracy": 0.9170347003154574, |
| "eval_f1": 0.9147487844408428, |
| "eval_loss": 0.20860691368579865, |
| "eval_precision": 0.9228253760627861, |
| "eval_recall": 0.9068123393316195, |
| "eval_runtime": 18.2871, |
| "eval_samples_per_second": 173.346, |
| "eval_steps_per_second": 21.709, |
| "step": 175 |
| }, |
| { |
| "epoch": 0.51, |
| "learning_rate": 3.475609756097561e-05, |
| "loss": 0.276, |
| "step": 176 |
| }, |
| { |
| "epoch": 0.53, |
| "learning_rate": 3.313008130081301e-05, |
| "loss": 0.2483, |
| "step": 184 |
| }, |
| { |
| "epoch": 0.55, |
| "learning_rate": 3.150406504065041e-05, |
| "loss": 0.2568, |
| "step": 192 |
| }, |
| { |
| "epoch": 0.58, |
| "learning_rate": 2.9878048780487805e-05, |
| "loss": 0.227, |
| "step": 200 |
| }, |
| { |
| "epoch": 0.58, |
| "eval_accuracy": 0.9198738170347003, |
| "eval_f1": 0.9166666666666666, |
| "eval_loss": 0.20122328400611877, |
| "eval_precision": 0.9363270777479893, |
| "eval_recall": 0.8978149100257069, |
| "eval_runtime": 18.2795, |
| "eval_samples_per_second": 173.418, |
| "eval_steps_per_second": 21.718, |
| "step": 200 |
| }, |
| { |
| "epoch": 0.6, |
| "learning_rate": 2.8252032520325205e-05, |
| "loss": 0.2167, |
| "step": 208 |
| }, |
| { |
| "epoch": 0.62, |
| "learning_rate": 2.66260162601626e-05, |
| "loss": 0.2033, |
| "step": 216 |
| }, |
| { |
| "epoch": 0.65, |
| "learning_rate": 2.5e-05, |
| "loss": 0.2357, |
| "step": 224 |
| }, |
| { |
| "epoch": 0.65, |
| "eval_accuracy": 0.9261829652996846, |
| "eval_f1": 0.9254302103250478, |
| "eval_loss": 0.18770882487297058, |
| "eval_precision": 0.9178255372945638, |
| "eval_recall": 0.9331619537275064, |
| "eval_runtime": 18.2243, |
| "eval_samples_per_second": 173.943, |
| "eval_steps_per_second": 21.784, |
| "step": 225 |
| } |
| ], |
| "max_steps": 346, |
| "num_train_epochs": 1, |
| "total_flos": 429199909056000.0, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|