End of training

Browse files

Files changed (5) hide show

README.md +15 -2
all_results.json +15 -0
eval_results.json +9 -0
train_results.json +9 -0
trainer_state.json +621 -0

README.md CHANGED Viewed

@@ -4,11 +4,24 @@ license: apache-2.0
 base_model: openai/whisper-medium
 tags:
 - generated_from_trainer
 metrics:
 - wer
 model-index:
 - name: whisper-medium-ph
-  results: []
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -16,7 +29,7 @@ should probably proofread and complete it, then remove this comment. -->
 # whisper-medium-ph
-This model is a fine-tuned version of [openai/whisper-medium](https://huggingface.co/openai/whisper-medium) on an unknown dataset.
 It achieves the following results on the evaluation set:
 - Loss: 0.3113
 - Wer: 0.1283

 base_model: openai/whisper-medium
 tags:
 - generated_from_trainer
+datasets:
+- rbcurzon/ph_dialect_asr
 metrics:
 - wer
 model-index:
 - name: whisper-medium-ph
+  results:
+  - task:
+      name: Automatic Speech Recognition
+      type: automatic-speech-recognition
+    dataset:
+      name: rbcurzon/ph_dialect_asr all
+      type: rbcurzon/ph_dialect_asr
+      args: all
+    metrics:
+    - name: Wer
+      type: wer
+      value: 0.12829864835872132
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 # whisper-medium-ph
+This model is a fine-tuned version of [openai/whisper-medium](https://huggingface.co/openai/whisper-medium) on the rbcurzon/ph_dialect_asr all dataset.
 It achieves the following results on the evaluation set:
 - Loss: 0.3113
 - Wer: 0.1283

all_results.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+    "epoch": 2.466091245376079,
+    "eval_loss": 0.3112793266773224,
+    "eval_runtime": 1173.9261,
+    "eval_samples": 3612,
+    "eval_samples_per_second": 3.077,
+    "eval_steps_per_second": 0.193,
+    "eval_wer": 0.12829864835872132,
+    "total_flos": 3.265323341119488e+19,
+    "train_loss": 0.2021937195956707,
+    "train_runtime": 9527.7148,
+    "train_samples": 12973,
+    "train_samples_per_second": 3.359,
+    "train_steps_per_second": 0.21
+}

eval_results.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+    "epoch": 2.466091245376079,
+    "eval_loss": 0.3112793266773224,
+    "eval_runtime": 1173.9261,
+    "eval_samples": 3612,
+    "eval_samples_per_second": 3.077,
+    "eval_steps_per_second": 0.193,
+    "eval_wer": 0.12829864835872132
+}

train_results.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+    "epoch": 2.466091245376079,
+    "total_flos": 3.265323341119488e+19,
+    "train_loss": 0.2021937195956707,
+    "train_runtime": 9527.7148,
+    "train_samples": 12973,
+    "train_samples_per_second": 3.359,
+    "train_steps_per_second": 0.21
+}

trainer_state.json ADDED Viewed

	@@ -0,0 +1,621 @@

+{
+  "best_global_step": null,
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 2.466091245376079,
+  "eval_steps": 1000,
+  "global_step": 2000,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.030826140567200986,
+      "grad_norm": 11.499724388122559,
+      "learning_rate": 4.4e-07,
+      "loss": 1.2454,
+      "step": 25
+    },
+    {
+      "epoch": 0.06165228113440197,
+      "grad_norm": 8.96716594696045,
+      "learning_rate": 9.400000000000001e-07,
+      "loss": 1.0189,
+      "step": 50
+    },
+    {
+      "epoch": 0.09247842170160296,
+      "grad_norm": 7.870485305786133,
+      "learning_rate": 1.44e-06,
+      "loss": 0.8525,
+      "step": 75
+    },
+    {
+      "epoch": 0.12330456226880394,
+      "grad_norm": 6.292770862579346,
+      "learning_rate": 1.94e-06,
+      "loss": 0.6987,
+      "step": 100
+    },
+    {
+      "epoch": 0.15413070283600494,
+      "grad_norm": 6.656809329986572,
+      "learning_rate": 2.4400000000000004e-06,
+      "loss": 0.6285,
+      "step": 125
+    },
+    {
+      "epoch": 0.18495684340320592,
+      "grad_norm": 6.315510272979736,
+      "learning_rate": 2.9400000000000002e-06,
+      "loss": 0.6055,
+      "step": 150
+    },
+    {
+      "epoch": 0.2157829839704069,
+      "grad_norm": 7.333935737609863,
+      "learning_rate": 3.44e-06,
+      "loss": 0.5517,
+      "step": 175
+    },
+    {
+      "epoch": 0.2466091245376079,
+      "grad_norm": 7.557521820068359,
+      "learning_rate": 3.94e-06,
+      "loss": 0.4966,
+      "step": 200
+    },
+    {
+      "epoch": 0.27743526510480887,
+      "grad_norm": 5.930201053619385,
+      "learning_rate": 4.440000000000001e-06,
+      "loss": 0.4821,
+      "step": 225
+    },
+    {
+      "epoch": 0.3082614056720099,
+      "grad_norm": 6.367243766784668,
+      "learning_rate": 4.94e-06,
+      "loss": 0.4661,
+      "step": 250
+    },
+    {
+      "epoch": 0.33908754623921084,
+      "grad_norm": 6.376411437988281,
+      "learning_rate": 5.4400000000000004e-06,
+      "loss": 0.4417,
+      "step": 275
+    },
+    {
+      "epoch": 0.36991368680641185,
+      "grad_norm": 5.1631574630737305,
+      "learning_rate": 5.94e-06,
+      "loss": 0.4297,
+      "step": 300
+    },
+    {
+      "epoch": 0.4007398273736128,
+      "grad_norm": 5.0071330070495605,
+      "learning_rate": 6.440000000000001e-06,
+      "loss": 0.3914,
+      "step": 325
+    },
+    {
+      "epoch": 0.4315659679408138,
+      "grad_norm": 4.759220123291016,
+      "learning_rate": 6.9400000000000005e-06,
+      "loss": 0.3548,
+      "step": 350
+    },
+    {
+      "epoch": 0.4623921085080148,
+      "grad_norm": 5.040701389312744,
+      "learning_rate": 7.440000000000001e-06,
+      "loss": 0.3546,
+      "step": 375
+    },
+    {
+      "epoch": 0.4932182490752158,
+      "grad_norm": 5.04915189743042,
+      "learning_rate": 7.94e-06,
+      "loss": 0.3388,
+      "step": 400
+    },
+    {
+      "epoch": 0.5240443896424167,
+      "grad_norm": 5.2604546546936035,
+      "learning_rate": 8.44e-06,
+      "loss": 0.3048,
+      "step": 425
+    },
+    {
+      "epoch": 0.5548705302096177,
+      "grad_norm": 5.409047603607178,
+      "learning_rate": 8.94e-06,
+      "loss": 0.3204,
+      "step": 450
+    },
+    {
+      "epoch": 0.5856966707768188,
+      "grad_norm": 7.095681190490723,
+      "learning_rate": 9.440000000000001e-06,
+      "loss": 0.2962,
+      "step": 475
+    },
+    {
+      "epoch": 0.6165228113440198,
+      "grad_norm": 5.518855571746826,
+      "learning_rate": 9.940000000000001e-06,
+      "loss": 0.2854,
+      "step": 500
+    },
+    {
+      "epoch": 0.6473489519112207,
+      "grad_norm": 5.083781719207764,
+      "learning_rate": 9.853333333333334e-06,
+      "loss": 0.2816,
+      "step": 525
+    },
+    {
+      "epoch": 0.6781750924784217,
+      "grad_norm": 4.599233150482178,
+      "learning_rate": 9.686666666666668e-06,
+      "loss": 0.2804,
+      "step": 550
+    },
+    {
+      "epoch": 0.7090012330456227,
+      "grad_norm": 5.882887840270996,
+      "learning_rate": 9.52e-06,
+      "loss": 0.254,
+      "step": 575
+    },
+    {
+      "epoch": 0.7398273736128237,
+      "grad_norm": 3.953178644180298,
+      "learning_rate": 9.353333333333334e-06,
+      "loss": 0.2522,
+      "step": 600
+    },
+    {
+      "epoch": 0.7706535141800247,
+      "grad_norm": 3.6629250049591064,
+      "learning_rate": 9.186666666666666e-06,
+      "loss": 0.2217,
+      "step": 625
+    },
+    {
+      "epoch": 0.8014796547472256,
+      "grad_norm": 5.168231010437012,
+      "learning_rate": 9.020000000000002e-06,
+      "loss": 0.2451,
+      "step": 650
+    },
+    {
+      "epoch": 0.8323057953144266,
+      "grad_norm": 4.211165904998779,
+      "learning_rate": 8.853333333333334e-06,
+      "loss": 0.216,
+      "step": 675
+    },
+    {
+      "epoch": 0.8631319358816276,
+      "grad_norm": 4.873836994171143,
+      "learning_rate": 8.686666666666668e-06,
+      "loss": 0.2027,
+      "step": 700
+    },
+    {
+      "epoch": 0.8939580764488286,
+      "grad_norm": 4.061721324920654,
+      "learning_rate": 8.52e-06,
+      "loss": 0.2184,
+      "step": 725
+    },
+    {
+      "epoch": 0.9247842170160296,
+      "grad_norm": 5.536831855773926,
+      "learning_rate": 8.353333333333335e-06,
+      "loss": 0.2212,
+      "step": 750
+    },
+    {
+      "epoch": 0.9556103575832305,
+      "grad_norm": 3.8625235557556152,
+      "learning_rate": 8.186666666666667e-06,
+      "loss": 0.1874,
+      "step": 775
+    },
+    {
+      "epoch": 0.9864364981504316,
+      "grad_norm": 4.030850887298584,
+      "learning_rate": 8.020000000000001e-06,
+      "loss": 0.1962,
+      "step": 800
+    },
+    {
+      "epoch": 1.0172626387176325,
+      "grad_norm": 3.3085479736328125,
+      "learning_rate": 7.853333333333333e-06,
+      "loss": 0.1508,
+      "step": 825
+    },
+    {
+      "epoch": 1.0480887792848335,
+      "grad_norm": 3.4279379844665527,
+      "learning_rate": 7.686666666666667e-06,
+      "loss": 0.0925,
+      "step": 850
+    },
+    {
+      "epoch": 1.0789149198520345,
+      "grad_norm": 3.8404757976531982,
+      "learning_rate": 7.520000000000001e-06,
+      "loss": 0.1182,
+      "step": 875
+    },
+    {
+      "epoch": 1.1097410604192355,
+      "grad_norm": 3.7630670070648193,
+      "learning_rate": 7.353333333333334e-06,
+      "loss": 0.1136,
+      "step": 900
+    },
+    {
+      "epoch": 1.1405672009864365,
+      "grad_norm": 3.491826295852661,
+      "learning_rate": 7.186666666666668e-06,
+      "loss": 0.1069,
+      "step": 925
+    },
+    {
+      "epoch": 1.1713933415536375,
+      "grad_norm": 2.2027463912963867,
+      "learning_rate": 7.0200000000000006e-06,
+      "loss": 0.1048,
+      "step": 950
+    },
+    {
+      "epoch": 1.2022194821208385,
+      "grad_norm": 4.981961250305176,
+      "learning_rate": 6.853333333333334e-06,
+      "loss": 0.1141,
+      "step": 975
+    },
+    {
+      "epoch": 1.2330456226880395,
+      "grad_norm": 3.4486851692199707,
+      "learning_rate": 6.6866666666666665e-06,
+      "loss": 0.1001,
+      "step": 1000
+    },
+    {
+      "epoch": 1.2330456226880395,
+      "eval_loss": 0.30403050780296326,
+      "eval_runtime": 1181.2571,
+      "eval_samples_per_second": 3.058,
+      "eval_steps_per_second": 0.191,
+      "eval_wer": 0.14332880402393383,
+      "step": 1000
+    },
+    {
+      "epoch": 1.2638717632552403,
+      "grad_norm": 2.620025396347046,
+      "learning_rate": 6.520000000000001e-06,
+      "loss": 0.0916,
+      "step": 1025
+    },
+    {
+      "epoch": 1.2946979038224415,
+      "grad_norm": 3.629256248474121,
+      "learning_rate": 6.353333333333333e-06,
+      "loss": 0.0949,
+      "step": 1050
+    },
+    {
+      "epoch": 1.3255240443896423,
+      "grad_norm": 2.832113265991211,
+      "learning_rate": 6.186666666666668e-06,
+      "loss": 0.084,
+      "step": 1075
+    },
+    {
+      "epoch": 1.3563501849568433,
+      "grad_norm": 3.5080323219299316,
+      "learning_rate": 6.02e-06,
+      "loss": 0.0881,
+      "step": 1100
+    },
+    {
+      "epoch": 1.3871763255240444,
+      "grad_norm": 3.9893321990966797,
+      "learning_rate": 5.853333333333335e-06,
+      "loss": 0.0781,
+      "step": 1125
+    },
+    {
+      "epoch": 1.4180024660912454,
+      "grad_norm": 2.786031723022461,
+      "learning_rate": 5.686666666666667e-06,
+      "loss": 0.0852,
+      "step": 1150
+    },
+    {
+      "epoch": 1.4488286066584464,
+      "grad_norm": 2.333205461502075,
+      "learning_rate": 5.5200000000000005e-06,
+      "loss": 0.0759,
+      "step": 1175
+    },
+    {
+      "epoch": 1.4796547472256474,
+      "grad_norm": 3.204261302947998,
+      "learning_rate": 5.3533333333333335e-06,
+      "loss": 0.0865,
+      "step": 1200
+    },
+    {
+      "epoch": 1.5104808877928484,
+      "grad_norm": 3.2963826656341553,
+      "learning_rate": 5.186666666666667e-06,
+      "loss": 0.0757,
+      "step": 1225
+    },
+    {
+      "epoch": 1.5413070283600492,
+      "grad_norm": 2.5825254917144775,
+      "learning_rate": 5.02e-06,
+      "loss": 0.0717,
+      "step": 1250
+    },
+    {
+      "epoch": 1.5721331689272504,
+      "grad_norm": 2.7192881107330322,
+      "learning_rate": 4.853333333333334e-06,
+      "loss": 0.0722,
+      "step": 1275
+    },
+    {
+      "epoch": 1.6029593094944512,
+      "grad_norm": 2.911716938018799,
+      "learning_rate": 4.686666666666667e-06,
+      "loss": 0.0757,
+      "step": 1300
+    },
+    {
+      "epoch": 1.6337854500616524,
+      "grad_norm": 2.1598548889160156,
+      "learning_rate": 4.520000000000001e-06,
+      "loss": 0.0704,
+      "step": 1325
+    },
+    {
+      "epoch": 1.6646115906288532,
+      "grad_norm": 2.1722934246063232,
+      "learning_rate": 4.353333333333334e-06,
+      "loss": 0.0621,
+      "step": 1350
+    },
+    {
+      "epoch": 1.6954377311960542,
+      "grad_norm": 2.0885589122772217,
+      "learning_rate": 4.1866666666666675e-06,
+      "loss": 0.0737,
+      "step": 1375
+    },
+    {
+      "epoch": 1.7262638717632552,
+      "grad_norm": 3.2038285732269287,
+      "learning_rate": 4.0200000000000005e-06,
+      "loss": 0.0729,
+      "step": 1400
+    },
+    {
+      "epoch": 1.7570900123304563,
+      "grad_norm": 2.2708075046539307,
+      "learning_rate": 3.853333333333334e-06,
+      "loss": 0.0571,
+      "step": 1425
+    },
+    {
+      "epoch": 1.7879161528976573,
+      "grad_norm": 1.496151089668274,
+      "learning_rate": 3.686666666666667e-06,
+      "loss": 0.0532,
+      "step": 1450
+    },
+    {
+      "epoch": 1.818742293464858,
+      "grad_norm": 1.8642607927322388,
+      "learning_rate": 3.52e-06,
+      "loss": 0.0544,
+      "step": 1475
+    },
+    {
+      "epoch": 1.8495684340320593,
+      "grad_norm": 2.1302435398101807,
+      "learning_rate": 3.3533333333333336e-06,
+      "loss": 0.0425,
+      "step": 1500
+    },
+    {
+      "epoch": 1.88039457459926,
+      "grad_norm": 1.2720330953598022,
+      "learning_rate": 3.186666666666667e-06,
+      "loss": 0.0486,
+      "step": 1525
+    },
+    {
+      "epoch": 1.9112207151664613,
+      "grad_norm": 1.3626000881195068,
+      "learning_rate": 3.0200000000000003e-06,
+      "loss": 0.0482,
+      "step": 1550
+    },
+    {
+      "epoch": 1.942046855733662,
+      "grad_norm": 2.652956485748291,
+      "learning_rate": 2.8533333333333337e-06,
+      "loss": 0.047,
+      "step": 1575
+    },
+    {
+      "epoch": 1.972872996300863,
+      "grad_norm": 2.178326368331909,
+      "learning_rate": 2.686666666666667e-06,
+      "loss": 0.0543,
+      "step": 1600
+    },
+    {
+      "epoch": 2.003699136868064,
+      "grad_norm": 0.6113713979721069,
+      "learning_rate": 2.52e-06,
+      "loss": 0.0416,
+      "step": 1625
+    },
+    {
+      "epoch": 2.034525277435265,
+      "grad_norm": 1.6302359104156494,
+      "learning_rate": 2.3533333333333334e-06,
+      "loss": 0.0167,
+      "step": 1650
+    },
+    {
+      "epoch": 2.065351418002466,
+      "grad_norm": 0.9459154605865479,
+      "learning_rate": 2.1866666666666668e-06,
+      "loss": 0.0137,
+      "step": 1675
+    },
+    {
+      "epoch": 2.096177558569667,
+      "grad_norm": 1.4943691492080688,
+      "learning_rate": 2.02e-06,
+      "loss": 0.0159,
+      "step": 1700
+    },
+    {
+      "epoch": 2.127003699136868,
+      "grad_norm": 0.5425832867622375,
+      "learning_rate": 1.8533333333333333e-06,
+      "loss": 0.0152,
+      "step": 1725
+    },
+    {
+      "epoch": 2.157829839704069,
+      "grad_norm": 1.4946790933609009,
+      "learning_rate": 1.6866666666666667e-06,
+      "loss": 0.0146,
+      "step": 1750
+    },
+    {
+      "epoch": 2.18865598027127,
+      "grad_norm": 0.9100169539451599,
+      "learning_rate": 1.52e-06,
+      "loss": 0.0191,
+      "step": 1775
+    },
+    {
+      "epoch": 2.219482120838471,
+      "grad_norm": 1.2448313236236572,
+      "learning_rate": 1.3533333333333334e-06,
+      "loss": 0.0159,
+      "step": 1800
+    },
+    {
+      "epoch": 2.250308261405672,
+      "grad_norm": 0.9976411461830139,
+      "learning_rate": 1.1866666666666668e-06,
+      "loss": 0.0203,
+      "step": 1825
+    },
+    {
+      "epoch": 2.281134401972873,
+      "grad_norm": 1.358780860900879,
+      "learning_rate": 1.02e-06,
+      "loss": 0.0139,
+      "step": 1850
+    },
+    {
+      "epoch": 2.311960542540074,
+      "grad_norm": 1.2800226211547852,
+      "learning_rate": 8.533333333333334e-07,
+      "loss": 0.0175,
+      "step": 1875
+    },
+    {
+      "epoch": 2.342786683107275,
+      "grad_norm": 1.007161021232605,
+      "learning_rate": 6.866666666666667e-07,
+      "loss": 0.013,
+      "step": 1900
+    },
+    {
+      "epoch": 2.373612823674476,
+      "grad_norm": 1.1838051080703735,
+      "learning_rate": 5.2e-07,
+      "loss": 0.0144,
+      "step": 1925
+    },
+    {
+      "epoch": 2.404438964241677,
+      "grad_norm": 1.2872673273086548,
+      "learning_rate": 3.533333333333334e-07,
+      "loss": 0.0134,
+      "step": 1950
+    },
+    {
+      "epoch": 2.435265104808878,
+      "grad_norm": 0.7094443440437317,
+      "learning_rate": 1.866666666666667e-07,
+      "loss": 0.0123,
+      "step": 1975
+    },
+    {
+      "epoch": 2.466091245376079,
+      "grad_norm": 0.6137486696243286,
+      "learning_rate": 2e-08,
+      "loss": 0.0125,
+      "step": 2000
+    },
+    {
+      "epoch": 2.466091245376079,
+      "eval_loss": 0.3112793266773224,
+      "eval_runtime": 1182.7026,
+      "eval_samples_per_second": 3.054,
+      "eval_steps_per_second": 0.191,
+      "eval_wer": 0.12829864835872132,
+      "step": 2000
+    },
+    {
+      "epoch": 2.466091245376079,
+      "step": 2000,
+      "total_flos": 3.265323341119488e+19,
+      "train_loss": 0.2021937195956707,
+      "train_runtime": 9527.7148,
+      "train_samples_per_second": 3.359,
+      "train_steps_per_second": 0.21
+    }
+  ],
+  "logging_steps": 25,
+  "max_steps": 2000,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 1000,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 3.265323341119488e+19,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}