whisper-small-me / trainer_state.json
razhan's picture
End of training
29f66d8
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 5.0,
"eval_steps": 500,
"global_step": 410,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.24390243902439024,
"grad_norm": 23.37420654296875,
"learning_rate": 1.5e-06,
"loss": 3.2045,
"step": 20
},
{
"epoch": 0.4878048780487805,
"grad_norm": 11.02387809753418,
"learning_rate": 3.5e-06,
"loss": 2.0765,
"step": 40
},
{
"epoch": 0.7317073170731707,
"grad_norm": 4.315557479858398,
"learning_rate": 5.500000000000001e-06,
"loss": 1.1171,
"step": 60
},
{
"epoch": 0.975609756097561,
"grad_norm": 3.7738795280456543,
"learning_rate": 7.500000000000001e-06,
"loss": 0.6946,
"step": 80
},
{
"epoch": 1.0,
"eval_avg_cer": 0.38252571063317314,
"eval_avg_wer": 0.8156832493942604,
"eval_gilaki_cer": 0.37511361177234365,
"eval_gilaki_wer": 0.9556110684089162,
"eval_hawrami_cer": 0.11549464078794902,
"eval_hawrami_wer": 0.5245801526717557,
"eval_laki_kurdish_cer": 0.2733040507564666,
"eval_laki_kurdish_wer": 0.7938650306748466,
"eval_loss": 0.766200602054596,
"eval_mazanderani_cer": 0.32235210768685796,
"eval_mazanderani_wer": 0.8120224146714213,
"eval_runtime": 281.2263,
"eval_samples_per_second": 11.585,
"eval_southern_kurdish_cer": 0.2192075497883561,
"eval_southern_kurdish_wer": 0.6800766283524904,
"eval_steps_per_second": 0.046,
"eval_talysh_cer": 0.3333333333333333,
"eval_talysh_wer": 0.9166666666666666,
"eval_zazaki_cer": 1.0388746803069053,
"eval_zazaki_wer": 1.0269607843137254,
"step": 82
},
{
"epoch": 1.2195121951219512,
"grad_norm": 2.4077467918395996,
"learning_rate": 9.5e-06,
"loss": 0.5333,
"step": 100
},
{
"epoch": 1.4634146341463414,
"grad_norm": 2.5292022228240967,
"learning_rate": 9.516129032258065e-06,
"loss": 0.4533,
"step": 120
},
{
"epoch": 1.7073170731707317,
"grad_norm": 2.2705225944519043,
"learning_rate": 8.870967741935484e-06,
"loss": 0.4231,
"step": 140
},
{
"epoch": 1.951219512195122,
"grad_norm": 2.4976840019226074,
"learning_rate": 8.225806451612904e-06,
"loss": 0.3864,
"step": 160
},
{
"epoch": 2.0,
"eval_avg_cer": 0.24537730055466347,
"eval_avg_wer": 0.686525530003659,
"eval_gilaki_cer": 0.34542306859987015,
"eval_gilaki_wer": 0.9579169869331283,
"eval_hawrami_cer": 0.07734646581691773,
"eval_hawrami_wer": 0.380559796437659,
"eval_laki_kurdish_cer": 0.15470961444607126,
"eval_laki_kurdish_wer": 0.5644171779141104,
"eval_loss": 0.5171846747398376,
"eval_mazanderani_cer": 0.18455543747786043,
"eval_mazanderani_wer": 0.609271523178808,
"eval_runtime": 283.0635,
"eval_samples_per_second": 11.51,
"eval_southern_kurdish_cer": 0.1742765942682673,
"eval_southern_kurdish_wer": 0.5484151863462209,
"eval_steps_per_second": 0.046,
"eval_talysh_cer": 0.5,
"eval_talysh_wer": 1.0,
"eval_zazaki_cer": 0.2813299232736573,
"eval_zazaki_wer": 0.7450980392156863,
"step": 164
},
{
"epoch": 2.1951219512195124,
"grad_norm": 2.0281219482421875,
"learning_rate": 7.580645161290323e-06,
"loss": 0.3523,
"step": 180
},
{
"epoch": 2.4390243902439024,
"grad_norm": 2.4135963916778564,
"learning_rate": 6.935483870967743e-06,
"loss": 0.3342,
"step": 200
},
{
"epoch": 2.682926829268293,
"grad_norm": 2.4130258560180664,
"learning_rate": 6.290322580645162e-06,
"loss": 0.3199,
"step": 220
},
{
"epoch": 2.926829268292683,
"grad_norm": 1.6657346487045288,
"learning_rate": 5.645161290322582e-06,
"loss": 0.3234,
"step": 240
},
{
"epoch": 3.0,
"eval_avg_cer": 0.2326738623090893,
"eval_avg_wer": 0.6506993324980173,
"eval_gilaki_cer": 0.35135252109932913,
"eval_gilaki_wer": 0.9632974634896234,
"eval_hawrami_cer": 0.07220451911935111,
"eval_hawrami_wer": 0.3532824427480916,
"eval_laki_kurdish_cer": 0.13624532292175046,
"eval_laki_kurdish_wer": 0.5231083844580777,
"eval_loss": 0.4686383008956909,
"eval_mazanderani_cer": 0.16519069547762427,
"eval_mazanderani_wer": 0.5476311767702496,
"eval_runtime": 284.8477,
"eval_samples_per_second": 11.438,
"eval_southern_kurdish_cer": 0.16740684199569772,
"eval_southern_kurdish_wer": 0.4935562521769418,
"eval_steps_per_second": 0.046,
"eval_talysh_cer": 0.5,
"eval_talysh_wer": 1.0,
"eval_zazaki_cer": 0.23631713554987213,
"eval_zazaki_wer": 0.6740196078431373,
"step": 246
},
{
"epoch": 3.1707317073170733,
"grad_norm": 1.7249436378479004,
"learning_rate": 5e-06,
"loss": 0.299,
"step": 260
},
{
"epoch": 3.4146341463414633,
"grad_norm": 1.6258125305175781,
"learning_rate": 4.35483870967742e-06,
"loss": 0.2806,
"step": 280
},
{
"epoch": 3.658536585365854,
"grad_norm": 1.9203271865844727,
"learning_rate": 3.7096774193548392e-06,
"loss": 0.2753,
"step": 300
},
{
"epoch": 3.902439024390244,
"grad_norm": 1.7945189476013184,
"learning_rate": 3.0645161290322584e-06,
"loss": 0.2786,
"step": 320
},
{
"epoch": 4.0,
"eval_avg_cer": 0.2249207301185327,
"eval_avg_wer": 0.632319681761422,
"eval_gilaki_cer": 0.3179398398615018,
"eval_gilaki_wer": 0.9083397386625672,
"eval_hawrami_cer": 0.07321842410196987,
"eval_hawrami_wer": 0.34849872773536894,
"eval_laki_kurdish_cer": 0.1333984057263706,
"eval_laki_kurdish_wer": 0.5047034764826176,
"eval_loss": 0.4527292251586914,
"eval_mazanderani_cer": 0.1596410438068249,
"eval_mazanderani_wer": 0.5277636271013755,
"eval_runtime": 287.001,
"eval_samples_per_second": 11.352,
"eval_southern_kurdish_cer": 0.1769481645964888,
"eval_southern_kurdish_wer": 0.4947753396029258,
"eval_steps_per_second": 0.045,
"eval_talysh_cer": 0.5,
"eval_talysh_wer": 1.0,
"eval_zazaki_cer": 0.2132992327365729,
"eval_zazaki_wer": 0.6421568627450981,
"step": 328
},
{
"epoch": 4.146341463414634,
"grad_norm": 1.4399691820144653,
"learning_rate": 2.4193548387096776e-06,
"loss": 0.2609,
"step": 340
},
{
"epoch": 4.390243902439025,
"grad_norm": 1.4866726398468018,
"learning_rate": 1.774193548387097e-06,
"loss": 0.2484,
"step": 360
},
{
"epoch": 4.634146341463414,
"grad_norm": 1.4835667610168457,
"learning_rate": 1.1290322580645162e-06,
"loss": 0.2567,
"step": 380
},
{
"epoch": 4.878048780487805,
"grad_norm": 1.4296433925628662,
"learning_rate": 4.838709677419355e-07,
"loss": 0.2586,
"step": 400
},
{
"epoch": 5.0,
"eval_avg_cer": 0.2212028617810692,
"eval_avg_wer": 0.6295649617906507,
"eval_gilaki_cer": 0.3175070331097165,
"eval_gilaki_wer": 0.9175634127594159,
"eval_hawrami_cer": 0.07082850521436848,
"eval_hawrami_wer": 0.345852417302799,
"eval_laki_kurdish_cer": 0.12469497315763788,
"eval_laki_kurdish_wer": 0.49038854805725973,
"eval_loss": 0.45085304975509644,
"eval_mazanderani_cer": 0.16153028692879914,
"eval_mazanderani_wer": 0.5277636271013755,
"eval_runtime": 287.0262,
"eval_samples_per_second": 11.351,
"eval_southern_kurdish_cer": 0.17181319825133579,
"eval_southern_kurdish_wer": 0.4930337861372344,
"eval_steps_per_second": 0.045,
"eval_talysh_cer": 0.5,
"eval_talysh_wer": 1.0,
"eval_zazaki_cer": 0.2020460358056266,
"eval_zazaki_wer": 0.6323529411764706,
"step": 410
},
{
"epoch": 5.0,
"step": 410,
"total_flos": 3.028992382327587e+19,
"train_loss": 0.6099171120946,
"train_runtime": 8367.268,
"train_samples_per_second": 12.473,
"train_steps_per_second": 0.049
}
],
"logging_steps": 20,
"max_steps": 410,
"num_input_tokens_seen": 0,
"num_train_epochs": 5,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 3.028992382327587e+19,
"train_batch_size": 128,
"trial_name": null,
"trial_params": null
}