| { |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 15.0, |
| "global_step": 1635, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.92, |
| "eval_loss": 3.606069326400757, |
| "eval_runtime": 74.9143, |
| "eval_samples_per_second": 21.985, |
| "eval_steps_per_second": 2.75, |
| "eval_wer": 1.0, |
| "step": 100 |
| }, |
| { |
| "epoch": 1.83, |
| "eval_loss": 3.0202510356903076, |
| "eval_runtime": 73.818, |
| "eval_samples_per_second": 22.312, |
| "eval_steps_per_second": 2.791, |
| "eval_wer": 0.9998978653865795, |
| "step": 200 |
| }, |
| { |
| "epoch": 2.75, |
| "eval_loss": 0.9479126930236816, |
| "eval_runtime": 73.9013, |
| "eval_samples_per_second": 22.286, |
| "eval_steps_per_second": 2.788, |
| "eval_wer": 0.791645388622204, |
| "step": 300 |
| }, |
| { |
| "epoch": 3.67, |
| "eval_loss": 0.6023567914962769, |
| "eval_runtime": 73.7383, |
| "eval_samples_per_second": 22.336, |
| "eval_steps_per_second": 2.794, |
| "eval_wer": 0.6285364109896844, |
| "step": 400 |
| }, |
| { |
| "epoch": 4.59, |
| "learning_rate": 0.0002988, |
| "loss": 3.1561, |
| "step": 500 |
| }, |
| { |
| "epoch": 4.59, |
| "eval_loss": 0.511204183101654, |
| "eval_runtime": 73.7804, |
| "eval_samples_per_second": 22.323, |
| "eval_steps_per_second": 2.792, |
| "eval_wer": 0.5369216627515064, |
| "step": 500 |
| }, |
| { |
| "epoch": 5.5, |
| "eval_loss": 0.45808982849121094, |
| "eval_runtime": 73.2344, |
| "eval_samples_per_second": 22.489, |
| "eval_steps_per_second": 2.813, |
| "eval_wer": 0.4900418751915024, |
| "step": 600 |
| }, |
| { |
| "epoch": 6.42, |
| "eval_loss": 0.43211525678634644, |
| "eval_runtime": 73.883, |
| "eval_samples_per_second": 22.292, |
| "eval_steps_per_second": 2.788, |
| "eval_wer": 0.4632826064753345, |
| "step": 700 |
| }, |
| { |
| "epoch": 7.34, |
| "eval_loss": 0.4252323508262634, |
| "eval_runtime": 73.1676, |
| "eval_samples_per_second": 22.51, |
| "eval_steps_per_second": 2.815, |
| "eval_wer": 0.43999591461546317, |
| "step": 800 |
| }, |
| { |
| "epoch": 8.26, |
| "eval_loss": 0.4203605055809021, |
| "eval_runtime": 73.3352, |
| "eval_samples_per_second": 22.459, |
| "eval_steps_per_second": 2.809, |
| "eval_wer": 0.4229394341742416, |
| "step": 900 |
| }, |
| { |
| "epoch": 9.17, |
| "learning_rate": 0.00016837004405286342, |
| "loss": 0.2247, |
| "step": 1000 |
| }, |
| { |
| "epoch": 9.17, |
| "eval_loss": 0.3948039710521698, |
| "eval_runtime": 73.35, |
| "eval_samples_per_second": 22.454, |
| "eval_steps_per_second": 2.808, |
| "eval_wer": 0.3970993769788581, |
| "step": 1000 |
| }, |
| { |
| "epoch": 10.09, |
| "eval_loss": 0.3996581435203552, |
| "eval_runtime": 73.0894, |
| "eval_samples_per_second": 22.534, |
| "eval_steps_per_second": 2.818, |
| "eval_wer": 0.39628230007149423, |
| "step": 1100 |
| }, |
| { |
| "epoch": 11.01, |
| "eval_loss": 0.4157370626926422, |
| "eval_runtime": 73.6448, |
| "eval_samples_per_second": 22.364, |
| "eval_steps_per_second": 2.797, |
| "eval_wer": 0.3894392809723215, |
| "step": 1200 |
| }, |
| { |
| "epoch": 11.93, |
| "eval_loss": 0.41419464349746704, |
| "eval_runtime": 72.7569, |
| "eval_samples_per_second": 22.637, |
| "eval_steps_per_second": 2.831, |
| "eval_wer": 0.38545603104892245, |
| "step": 1300 |
| }, |
| { |
| "epoch": 12.84, |
| "eval_loss": 0.4107553958892822, |
| "eval_runtime": 72.5948, |
| "eval_samples_per_second": 22.688, |
| "eval_steps_per_second": 2.838, |
| "eval_wer": 0.36380349300377895, |
| "step": 1400 |
| }, |
| { |
| "epoch": 13.76, |
| "learning_rate": 3.621145374449339e-05, |
| "loss": 0.1022, |
| "step": 1500 |
| }, |
| { |
| "epoch": 13.76, |
| "eval_loss": 0.3928930163383484, |
| "eval_runtime": 73.1498, |
| "eval_samples_per_second": 22.515, |
| "eval_steps_per_second": 2.816, |
| "eval_wer": 0.3617608007353692, |
| "step": 1500 |
| }, |
| { |
| "epoch": 14.68, |
| "eval_loss": 0.4004472494125366, |
| "eval_runtime": 72.6133, |
| "eval_samples_per_second": 22.682, |
| "eval_steps_per_second": 2.837, |
| "eval_wer": 0.3544071085690941, |
| "step": 1600 |
| }, |
| { |
| "epoch": 15.0, |
| "step": 1635, |
| "total_flos": 6.464559143942451e+18, |
| "train_loss": 1.071420776297193, |
| "train_runtime": 3969.9688, |
| "train_samples_per_second": 13.141, |
| "train_steps_per_second": 0.412 |
| } |
| ], |
| "max_steps": 1635, |
| "num_train_epochs": 15, |
| "total_flos": 6.464559143942451e+18, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|