| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 0.4686523640908144, | |
| "global_step": 4500, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.05, | |
| "learning_rate": 2.947927515101021e-05, | |
| "loss": 2.2374, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.05, | |
| "eval_exact_match": 49.46965745087811, | |
| "eval_f1": 54.705922468625346, | |
| "eval_loss": 1.399248480796814, | |
| "eval_runtime": 152.8082, | |
| "eval_samples_per_second": 92.96, | |
| "eval_steps_per_second": 11.622, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.1, | |
| "learning_rate": 2.8958550302020413e-05, | |
| "loss": 1.1963, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 0.1, | |
| "eval_exact_match": 54.33837593462007, | |
| "eval_f1": 59.335692166319255, | |
| "eval_loss": 1.046236276626587, | |
| "eval_runtime": 153.237, | |
| "eval_samples_per_second": 92.7, | |
| "eval_steps_per_second": 11.59, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 0.16, | |
| "learning_rate": 2.8437825453030617e-05, | |
| "loss": 1.1031, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 0.16, | |
| "eval_exact_match": 56.17283950617284, | |
| "eval_f1": 61.40430603082631, | |
| "eval_loss": 0.8644341230392456, | |
| "eval_runtime": 153.7515, | |
| "eval_samples_per_second": 92.389, | |
| "eval_steps_per_second": 11.551, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 0.21, | |
| "learning_rate": 2.7917100604040825e-05, | |
| "loss": 0.9479, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 0.21, | |
| "eval_exact_match": 57.21613632411754, | |
| "eval_f1": 61.625922292628005, | |
| "eval_loss": 0.7944296002388, | |
| "eval_runtime": 153.833, | |
| "eval_samples_per_second": 92.34, | |
| "eval_steps_per_second": 11.545, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 0.26, | |
| "learning_rate": 2.7396375755051033e-05, | |
| "loss": 0.899, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 0.26, | |
| "eval_exact_match": 59.867849069727, | |
| "eval_f1": 64.17727571949499, | |
| "eval_loss": 0.7857800722122192, | |
| "eval_runtime": 154.1204, | |
| "eval_samples_per_second": 92.168, | |
| "eval_steps_per_second": 11.523, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 0.31, | |
| "learning_rate": 2.6875650906061238e-05, | |
| "loss": 0.8672, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 0.31, | |
| "eval_exact_match": 65.00608589810467, | |
| "eval_f1": 69.60946105310353, | |
| "eval_loss": 0.8072792887687683, | |
| "eval_runtime": 154.2464, | |
| "eval_samples_per_second": 92.093, | |
| "eval_steps_per_second": 11.514, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 0.36, | |
| "learning_rate": 2.6354926057071445e-05, | |
| "loss": 0.8375, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 0.36, | |
| "eval_exact_match": 63.82368283776734, | |
| "eval_f1": 68.19581427410363, | |
| "eval_loss": 0.7115561366081238, | |
| "eval_runtime": 154.7006, | |
| "eval_samples_per_second": 91.822, | |
| "eval_steps_per_second": 11.48, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 0.42, | |
| "learning_rate": 2.583420120808165e-05, | |
| "loss": 0.8454, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 0.42, | |
| "eval_exact_match": 65.8320292123109, | |
| "eval_f1": 70.26703931597173, | |
| "eval_loss": 0.6987438201904297, | |
| "eval_runtime": 154.6403, | |
| "eval_samples_per_second": 91.858, | |
| "eval_steps_per_second": 11.485, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 0.47, | |
| "learning_rate": 2.5313476359091858e-05, | |
| "loss": 0.8031, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 0.47, | |
| "eval_exact_match": 62.44131455399061, | |
| "eval_f1": 66.50570614180938, | |
| "eval_loss": 0.6731235980987549, | |
| "eval_runtime": 154.5393, | |
| "eval_samples_per_second": 91.918, | |
| "eval_steps_per_second": 11.492, | |
| "step": 4500 | |
| } | |
| ], | |
| "max_steps": 28806, | |
| "num_train_epochs": 3, | |
| "total_flos": 9406683242496000.0, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |