| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 2.803738317757009, | |
| "global_step": 300, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.93, | |
| "learning_rate": 0.00020654205607476632, | |
| "loss": 2.3489, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_loss": 1.9349576234817505, | |
| "eval_rouge1": 0.39386190784575437, | |
| "eval_rouge2": 0.2517830958048599, | |
| "eval_rougeL": 0.34926703865997477, | |
| "eval_rougeLsum": 0.3558229004695481, | |
| "eval_runtime": 113.9089, | |
| "eval_samples_per_second": 2.493, | |
| "eval_steps_per_second": 0.623, | |
| "step": 107 | |
| }, | |
| { | |
| "epoch": 1.87, | |
| "learning_rate": 0.00011308411214953269, | |
| "loss": 1.8838, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_loss": 1.8483030796051025, | |
| "eval_rouge1": 0.40113136486018286, | |
| "eval_rouge2": 0.25896861252154124, | |
| "eval_rougeL": 0.3557696923144424, | |
| "eval_rougeLsum": 0.3624647104286536, | |
| "eval_runtime": 124.5217, | |
| "eval_samples_per_second": 2.281, | |
| "eval_steps_per_second": 0.57, | |
| "step": 214 | |
| }, | |
| { | |
| "epoch": 2.8, | |
| "learning_rate": 1.9626168224299062e-05, | |
| "loss": 1.686, | |
| "step": 300 | |
| } | |
| ], | |
| "max_steps": 321, | |
| "num_train_epochs": 3, | |
| "total_flos": 111492406112256.0, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |