| { |
| "best_metric": 100.44140975239672, |
| "best_model_checkpoint": "./whisper-medium-sw/checkpoint-1000", |
| "epoch": 0.8684324793747286, |
| "global_step": 2000, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.01, |
| "learning_rate": 4.4e-07, |
| "loss": 3.9918, |
| "step": 25 |
| }, |
| { |
| "epoch": 0.02, |
| "learning_rate": 9.400000000000001e-07, |
| "loss": 2.9378, |
| "step": 50 |
| }, |
| { |
| "epoch": 0.03, |
| "learning_rate": 1.44e-06, |
| "loss": 2.2426, |
| "step": 75 |
| }, |
| { |
| "epoch": 0.04, |
| "learning_rate": 1.94e-06, |
| "loss": 1.9092, |
| "step": 100 |
| }, |
| { |
| "epoch": 0.05, |
| "learning_rate": 2.4400000000000004e-06, |
| "loss": 1.5559, |
| "step": 125 |
| }, |
| { |
| "epoch": 0.07, |
| "learning_rate": 2.9400000000000002e-06, |
| "loss": 1.3102, |
| "step": 150 |
| }, |
| { |
| "epoch": 0.08, |
| "learning_rate": 3.44e-06, |
| "loss": 0.8516, |
| "step": 175 |
| }, |
| { |
| "epoch": 0.09, |
| "learning_rate": 3.94e-06, |
| "loss": 0.7099, |
| "step": 200 |
| }, |
| { |
| "epoch": 0.1, |
| "learning_rate": 4.440000000000001e-06, |
| "loss": 0.6525, |
| "step": 225 |
| }, |
| { |
| "epoch": 0.11, |
| "learning_rate": 4.94e-06, |
| "loss": 0.6032, |
| "step": 250 |
| }, |
| { |
| "epoch": 0.12, |
| "learning_rate": 5.4400000000000004e-06, |
| "loss": 0.6283, |
| "step": 275 |
| }, |
| { |
| "epoch": 0.13, |
| "learning_rate": 5.94e-06, |
| "loss": 0.5585, |
| "step": 300 |
| }, |
| { |
| "epoch": 0.14, |
| "learning_rate": 6.440000000000001e-06, |
| "loss": 0.5346, |
| "step": 325 |
| }, |
| { |
| "epoch": 0.15, |
| "learning_rate": 6.9400000000000005e-06, |
| "loss": 0.5352, |
| "step": 350 |
| }, |
| { |
| "epoch": 0.16, |
| "learning_rate": 7.440000000000001e-06, |
| "loss": 0.477, |
| "step": 375 |
| }, |
| { |
| "epoch": 0.17, |
| "learning_rate": 7.94e-06, |
| "loss": 0.4809, |
| "step": 400 |
| }, |
| { |
| "epoch": 0.18, |
| "learning_rate": 8.44e-06, |
| "loss": 0.4502, |
| "step": 425 |
| }, |
| { |
| "epoch": 0.2, |
| "learning_rate": 8.94e-06, |
| "loss": 0.479, |
| "step": 450 |
| }, |
| { |
| "epoch": 0.21, |
| "learning_rate": 9.440000000000001e-06, |
| "loss": 0.4514, |
| "step": 475 |
| }, |
| { |
| "epoch": 0.22, |
| "learning_rate": 9.940000000000001e-06, |
| "loss": 0.477, |
| "step": 500 |
| }, |
| { |
| "epoch": 0.23, |
| "learning_rate": 9.937142857142858e-06, |
| "loss": 0.473, |
| "step": 525 |
| }, |
| { |
| "epoch": 0.24, |
| "learning_rate": 9.865714285714285e-06, |
| "loss": 0.4485, |
| "step": 550 |
| }, |
| { |
| "epoch": 0.25, |
| "learning_rate": 9.794285714285714e-06, |
| "loss": 0.4196, |
| "step": 575 |
| }, |
| { |
| "epoch": 0.26, |
| "learning_rate": 9.722857142857143e-06, |
| "loss": 0.4217, |
| "step": 600 |
| }, |
| { |
| "epoch": 0.27, |
| "learning_rate": 9.651428571428572e-06, |
| "loss": 0.4061, |
| "step": 625 |
| }, |
| { |
| "epoch": 0.28, |
| "learning_rate": 9.58e-06, |
| "loss": 0.4141, |
| "step": 650 |
| }, |
| { |
| "epoch": 0.29, |
| "learning_rate": 9.508571428571429e-06, |
| "loss": 0.4025, |
| "step": 675 |
| }, |
| { |
| "epoch": 0.3, |
| "learning_rate": 9.437142857142858e-06, |
| "loss": 0.4048, |
| "step": 700 |
| }, |
| { |
| "epoch": 0.31, |
| "learning_rate": 9.365714285714287e-06, |
| "loss": 0.3943, |
| "step": 725 |
| }, |
| { |
| "epoch": 0.33, |
| "learning_rate": 9.294285714285714e-06, |
| "loss": 0.3922, |
| "step": 750 |
| }, |
| { |
| "epoch": 0.34, |
| "learning_rate": 9.222857142857143e-06, |
| "loss": 0.3607, |
| "step": 775 |
| }, |
| { |
| "epoch": 0.35, |
| "learning_rate": 9.151428571428572e-06, |
| "loss": 0.3546, |
| "step": 800 |
| }, |
| { |
| "epoch": 0.36, |
| "learning_rate": 9.080000000000001e-06, |
| "loss": 0.3907, |
| "step": 825 |
| }, |
| { |
| "epoch": 0.37, |
| "learning_rate": 9.00857142857143e-06, |
| "loss": 0.365, |
| "step": 850 |
| }, |
| { |
| "epoch": 0.38, |
| "learning_rate": 8.937142857142857e-06, |
| "loss": 0.3411, |
| "step": 875 |
| }, |
| { |
| "epoch": 0.39, |
| "learning_rate": 8.865714285714287e-06, |
| "loss": 0.3741, |
| "step": 900 |
| }, |
| { |
| "epoch": 0.4, |
| "learning_rate": 8.794285714285716e-06, |
| "loss": 0.3313, |
| "step": 925 |
| }, |
| { |
| "epoch": 0.41, |
| "learning_rate": 8.722857142857145e-06, |
| "loss": 0.3643, |
| "step": 950 |
| }, |
| { |
| "epoch": 0.42, |
| "learning_rate": 8.651428571428572e-06, |
| "loss": 0.3341, |
| "step": 975 |
| }, |
| { |
| "epoch": 0.43, |
| "learning_rate": 8.580000000000001e-06, |
| "loss": 0.3495, |
| "step": 1000 |
| }, |
| { |
| "epoch": 0.43, |
| "eval_loss": 0.45124879479408264, |
| "eval_runtime": 3578.9421, |
| "eval_samples_per_second": 2.861, |
| "eval_steps_per_second": 0.358, |
| "eval_wer": 100.44140975239672, |
| "step": 1000 |
| }, |
| { |
| "epoch": 0.45, |
| "learning_rate": 8.50857142857143e-06, |
| "loss": 0.346, |
| "step": 1025 |
| }, |
| { |
| "epoch": 0.46, |
| "learning_rate": 8.437142857142859e-06, |
| "loss": 0.3359, |
| "step": 1050 |
| }, |
| { |
| "epoch": 0.47, |
| "learning_rate": 8.365714285714286e-06, |
| "loss": 0.3108, |
| "step": 1075 |
| }, |
| { |
| "epoch": 0.48, |
| "learning_rate": 8.294285714285715e-06, |
| "loss": 0.3253, |
| "step": 1100 |
| }, |
| { |
| "epoch": 0.49, |
| "learning_rate": 8.222857142857144e-06, |
| "loss": 0.3359, |
| "step": 1125 |
| }, |
| { |
| "epoch": 0.5, |
| "learning_rate": 8.151428571428572e-06, |
| "loss": 0.3005, |
| "step": 1150 |
| }, |
| { |
| "epoch": 0.51, |
| "learning_rate": 8.08e-06, |
| "loss": 0.2959, |
| "step": 1175 |
| }, |
| { |
| "epoch": 0.52, |
| "learning_rate": 8.00857142857143e-06, |
| "loss": 0.3158, |
| "step": 1200 |
| }, |
| { |
| "epoch": 0.53, |
| "learning_rate": 7.937142857142857e-06, |
| "loss": 0.3128, |
| "step": 1225 |
| }, |
| { |
| "epoch": 0.54, |
| "learning_rate": 7.865714285714286e-06, |
| "loss": 0.2948, |
| "step": 1250 |
| }, |
| { |
| "epoch": 0.55, |
| "learning_rate": 7.794285714285715e-06, |
| "loss": 0.3347, |
| "step": 1275 |
| }, |
| { |
| "epoch": 0.56, |
| "learning_rate": 7.722857142857142e-06, |
| "loss": 0.3128, |
| "step": 1300 |
| }, |
| { |
| "epoch": 0.58, |
| "learning_rate": 7.651428571428571e-06, |
| "loss": 0.3195, |
| "step": 1325 |
| }, |
| { |
| "epoch": 0.59, |
| "learning_rate": 7.58e-06, |
| "loss": 0.3079, |
| "step": 1350 |
| }, |
| { |
| "epoch": 0.6, |
| "learning_rate": 7.508571428571429e-06, |
| "loss": 0.2939, |
| "step": 1375 |
| }, |
| { |
| "epoch": 0.61, |
| "learning_rate": 7.4371428571428575e-06, |
| "loss": 0.288, |
| "step": 1400 |
| }, |
| { |
| "epoch": 0.62, |
| "learning_rate": 7.365714285714286e-06, |
| "loss": 0.2863, |
| "step": 1425 |
| }, |
| { |
| "epoch": 0.63, |
| "learning_rate": 7.294285714285715e-06, |
| "loss": 0.3064, |
| "step": 1450 |
| }, |
| { |
| "epoch": 0.64, |
| "learning_rate": 7.222857142857144e-06, |
| "loss": 0.2752, |
| "step": 1475 |
| }, |
| { |
| "epoch": 0.65, |
| "learning_rate": 7.151428571428573e-06, |
| "loss": 0.299, |
| "step": 1500 |
| }, |
| { |
| "epoch": 0.66, |
| "learning_rate": 7.08e-06, |
| "loss": 0.2867, |
| "step": 1525 |
| }, |
| { |
| "epoch": 0.67, |
| "learning_rate": 7.008571428571429e-06, |
| "loss": 0.2622, |
| "step": 1550 |
| }, |
| { |
| "epoch": 0.68, |
| "learning_rate": 6.937142857142858e-06, |
| "loss": 0.2844, |
| "step": 1575 |
| }, |
| { |
| "epoch": 0.69, |
| "learning_rate": 6.865714285714287e-06, |
| "loss": 0.2897, |
| "step": 1600 |
| }, |
| { |
| "epoch": 0.71, |
| "learning_rate": 6.794285714285714e-06, |
| "loss": 0.2833, |
| "step": 1625 |
| }, |
| { |
| "epoch": 0.72, |
| "learning_rate": 6.722857142857143e-06, |
| "loss": 0.3021, |
| "step": 1650 |
| }, |
| { |
| "epoch": 0.73, |
| "learning_rate": 6.651428571428572e-06, |
| "loss": 0.2912, |
| "step": 1675 |
| }, |
| { |
| "epoch": 0.74, |
| "learning_rate": 6.5800000000000005e-06, |
| "loss": 0.2884, |
| "step": 1700 |
| }, |
| { |
| "epoch": 0.75, |
| "learning_rate": 6.5085714285714295e-06, |
| "loss": 0.2705, |
| "step": 1725 |
| }, |
| { |
| "epoch": 0.76, |
| "learning_rate": 6.437142857142858e-06, |
| "loss": 0.2626, |
| "step": 1750 |
| }, |
| { |
| "epoch": 0.77, |
| "learning_rate": 6.365714285714286e-06, |
| "loss": 0.2974, |
| "step": 1775 |
| }, |
| { |
| "epoch": 0.78, |
| "learning_rate": 6.294285714285715e-06, |
| "loss": 0.2678, |
| "step": 1800 |
| }, |
| { |
| "epoch": 0.79, |
| "learning_rate": 6.222857142857144e-06, |
| "loss": 0.2712, |
| "step": 1825 |
| }, |
| { |
| "epoch": 0.8, |
| "learning_rate": 6.151428571428571e-06, |
| "loss": 0.2733, |
| "step": 1850 |
| }, |
| { |
| "epoch": 0.81, |
| "learning_rate": 6.08e-06, |
| "loss": 0.2598, |
| "step": 1875 |
| }, |
| { |
| "epoch": 0.83, |
| "learning_rate": 6.008571428571429e-06, |
| "loss": 0.2905, |
| "step": 1900 |
| }, |
| { |
| "epoch": 0.84, |
| "learning_rate": 5.937142857142858e-06, |
| "loss": 0.272, |
| "step": 1925 |
| }, |
| { |
| "epoch": 0.85, |
| "learning_rate": 5.865714285714286e-06, |
| "loss": 0.2674, |
| "step": 1950 |
| }, |
| { |
| "epoch": 0.86, |
| "learning_rate": 5.794285714285715e-06, |
| "loss": 0.2659, |
| "step": 1975 |
| }, |
| { |
| "epoch": 0.87, |
| "learning_rate": 5.722857142857144e-06, |
| "loss": 0.2634, |
| "step": 2000 |
| }, |
| { |
| "epoch": 0.87, |
| "eval_loss": 0.3813508152961731, |
| "eval_runtime": 3665.2487, |
| "eval_samples_per_second": 2.793, |
| "eval_steps_per_second": 0.349, |
| "eval_wer": 101.54493413338852, |
| "step": 2000 |
| } |
| ], |
| "max_steps": 4000, |
| "num_train_epochs": 2, |
| "total_flos": 3.265935704064e+19, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|