| { | |
| "best_metric": 16.48035114189699, | |
| "best_model_checkpoint": "CHECKPOINTS/checkpoint-8", | |
| "epoch": 13.025, | |
| "eval_steps": 8, | |
| "global_step": 80, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.025, | |
| "eval_loss": 1.0526559352874756, | |
| "eval_runtime": 256.5611, | |
| "eval_samples_per_second": 0.873, | |
| "eval_steps_per_second": 0.008, | |
| "eval_wer": 16.48035114189699, | |
| "step": 8 | |
| }, | |
| { | |
| "epoch": 2.05, | |
| "eval_loss": 0.55241459608078, | |
| "eval_runtime": 257.8672, | |
| "eval_samples_per_second": 0.869, | |
| "eval_steps_per_second": 0.008, | |
| "eval_wer": 16.72038954804197, | |
| "step": 16 | |
| }, | |
| { | |
| "epoch": 3.075, | |
| "eval_loss": 0.4660560190677643, | |
| "eval_runtime": 258.0886, | |
| "eval_samples_per_second": 0.868, | |
| "eval_steps_per_second": 0.008, | |
| "eval_wer": 18.23606062684315, | |
| "step": 24 | |
| }, | |
| { | |
| "epoch": 5.025, | |
| "eval_loss": 0.41761377453804016, | |
| "eval_runtime": 270.1611, | |
| "eval_samples_per_second": 0.829, | |
| "eval_steps_per_second": 0.007, | |
| "eval_wer": 21.301693985323368, | |
| "step": 32 | |
| }, | |
| { | |
| "epoch": 6.05, | |
| "eval_loss": 0.4736975133419037, | |
| "eval_runtime": 287.4266, | |
| "eval_samples_per_second": 0.779, | |
| "eval_steps_per_second": 0.007, | |
| "eval_wer": 31.82909265482477, | |
| "step": 40 | |
| }, | |
| { | |
| "epoch": 7.075, | |
| "eval_loss": 0.4601687788963318, | |
| "eval_runtime": 256.8801, | |
| "eval_samples_per_second": 0.872, | |
| "eval_steps_per_second": 0.008, | |
| "eval_wer": 17.399355325423496, | |
| "step": 48 | |
| }, | |
| { | |
| "epoch": 9.025, | |
| "eval_loss": 0.45703616738319397, | |
| "eval_runtime": 256.3162, | |
| "eval_samples_per_second": 0.874, | |
| "eval_steps_per_second": 0.008, | |
| "eval_wer": 18.105754063507305, | |
| "step": 56 | |
| }, | |
| { | |
| "epoch": 10.05, | |
| "eval_loss": 0.4644158184528351, | |
| "eval_runtime": 256.0296, | |
| "eval_samples_per_second": 0.875, | |
| "eval_steps_per_second": 0.008, | |
| "eval_wer": 18.318359508950003, | |
| "step": 64 | |
| }, | |
| { | |
| "epoch": 11.075, | |
| "eval_loss": 0.46031108498573303, | |
| "eval_runtime": 256.8198, | |
| "eval_samples_per_second": 0.872, | |
| "eval_steps_per_second": 0.008, | |
| "eval_wer": 18.215485906316438, | |
| "step": 72 | |
| }, | |
| { | |
| "epoch": 13.025, | |
| "eval_loss": 0.4596288502216339, | |
| "eval_runtime": 254.7423, | |
| "eval_samples_per_second": 0.879, | |
| "eval_steps_per_second": 0.008, | |
| "eval_wer": 18.14690350456073, | |
| "step": 80 | |
| }, | |
| { | |
| "epoch": 13.025, | |
| "step": 80, | |
| "total_flos": 3.4790381338471956e+19, | |
| "train_loss": 0.15404987335205078, | |
| "train_runtime": 3979.2182, | |
| "train_samples_per_second": 2.573, | |
| "train_steps_per_second": 0.02 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 80, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 9223372036854775807, | |
| "save_steps": 8, | |
| "total_flos": 3.4790381338471956e+19, | |
| "train_batch_size": 32, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |