| { |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 0.5266468686454935, |
| "global_step": 4500, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.06, |
| "learning_rate": 0.00015, |
| "loss": 2.5393, |
| "step": 500 |
| }, |
| { |
| "epoch": 0.06, |
| "eval_loss": 0.4428945779800415, |
| "eval_phone_accuracy": 0.9003876271495096, |
| "eval_runtime": 16.8778, |
| "eval_samples_per_second": 11.85, |
| "eval_steps_per_second": 2.962, |
| "step": 500 |
| }, |
| { |
| "epoch": 0.12, |
| "learning_rate": 0.0003, |
| "loss": 0.4474, |
| "step": 1000 |
| }, |
| { |
| "epoch": 0.12, |
| "eval_loss": 0.2071739137172699, |
| "eval_phone_accuracy": 0.9347190787134594, |
| "eval_runtime": 15.9974, |
| "eval_samples_per_second": 12.502, |
| "eval_steps_per_second": 3.126, |
| "step": 1000 |
| }, |
| { |
| "epoch": 0.18, |
| "learning_rate": 0.00028011664899257687, |
| "loss": 0.3105, |
| "step": 1500 |
| }, |
| { |
| "epoch": 0.18, |
| "eval_loss": 0.174857959151268, |
| "eval_phone_accuracy": 0.94312200282699, |
| "eval_runtime": 16.5779, |
| "eval_samples_per_second": 12.064, |
| "eval_steps_per_second": 3.016, |
| "step": 1500 |
| }, |
| { |
| "epoch": 0.23, |
| "learning_rate": 0.0002602332979851537, |
| "loss": 0.2682, |
| "step": 2000 |
| }, |
| { |
| "epoch": 0.23, |
| "eval_loss": 0.16749557852745056, |
| "eval_phone_accuracy": 0.9447956502510471, |
| "eval_runtime": 15.1084, |
| "eval_samples_per_second": 13.238, |
| "eval_steps_per_second": 3.309, |
| "step": 2000 |
| }, |
| { |
| "epoch": 0.29, |
| "learning_rate": 0.0002403499469777306, |
| "loss": 0.2467, |
| "step": 2500 |
| }, |
| { |
| "epoch": 0.29, |
| "eval_loss": 0.15832921862602234, |
| "eval_phone_accuracy": 0.9478567774048926, |
| "eval_runtime": 14.9641, |
| "eval_samples_per_second": 13.365, |
| "eval_steps_per_second": 3.341, |
| "step": 2500 |
| }, |
| { |
| "epoch": 0.35, |
| "learning_rate": 0.00022046659597030753, |
| "loss": 0.2324, |
| "step": 3000 |
| }, |
| { |
| "epoch": 0.35, |
| "eval_loss": 0.14310674369335175, |
| "eval_phone_accuracy": 0.949885966509708, |
| "eval_runtime": 15.0339, |
| "eval_samples_per_second": 13.303, |
| "eval_steps_per_second": 3.326, |
| "step": 3000 |
| }, |
| { |
| "epoch": 0.41, |
| "learning_rate": 0.0002005832449628844, |
| "loss": 0.22, |
| "step": 3500 |
| }, |
| { |
| "epoch": 0.41, |
| "eval_loss": 0.13784204423427582, |
| "eval_phone_accuracy": 0.9521579645672364, |
| "eval_runtime": 16.1699, |
| "eval_samples_per_second": 12.369, |
| "eval_steps_per_second": 3.092, |
| "step": 3500 |
| }, |
| { |
| "epoch": 0.47, |
| "learning_rate": 0.0001806998939554613, |
| "loss": 0.2109, |
| "step": 4000 |
| }, |
| { |
| "epoch": 0.47, |
| "eval_loss": 0.1341935396194458, |
| "eval_phone_accuracy": 0.9543519168899642, |
| "eval_runtime": 15.6229, |
| "eval_samples_per_second": 12.802, |
| "eval_steps_per_second": 3.2, |
| "step": 4000 |
| }, |
| { |
| "epoch": 0.53, |
| "learning_rate": 0.00016081654294803816, |
| "loss": 0.2039, |
| "step": 4500 |
| }, |
| { |
| "epoch": 0.53, |
| "eval_loss": 0.13459673523902893, |
| "eval_phone_accuracy": 0.9526435824726623, |
| "eval_runtime": 15.5354, |
| "eval_samples_per_second": 12.874, |
| "eval_steps_per_second": 3.218, |
| "step": 4500 |
| } |
| ], |
| "max_steps": 8544, |
| "num_train_epochs": 1, |
| "total_flos": 7.300030651149006e+19, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|