razhan committed on
Commit
5725a17
·
verified ·
1 Parent(s): 2b22d36

End of training

Browse files
Files changed (5) hide show
  1. README.md +15 -2
  2. all_results.json +13 -14
  3. eval_results.json +7 -7
  4. train_results.json +7 -7
  5. trainer_state.json +126 -74
README.md CHANGED
@@ -4,11 +4,24 @@ license: apache-2.0
4
  base_model: openai/whisper-base
5
  tags:
6
  - generated_from_trainer
 
 
7
  metrics:
8
  - wer
9
  model-index:
10
  - name: whisper-base-hac
11
- results: []
 
 
 
 
 
 
 
 
 
 
 
12
  ---
13
 
14
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -16,7 +29,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # whisper-base-hac
18
 
19
- This model is a fine-tuned version of [openai/whisper-base](https://huggingface.co/openai/whisper-base) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
  - Loss: 0.3272
22
  - Wer: 0.4792
 
4
  base_model: openai/whisper-base
5
  tags:
6
  - generated_from_trainer
7
+ datasets:
8
+ - razhan/DOLMA-speech
9
  metrics:
10
  - wer
11
  model-index:
12
  - name: whisper-base-hac
13
+ results:
14
+ - task:
15
+ name: Automatic Speech Recognition
16
+ type: automatic-speech-recognition
17
+ dataset:
18
+ name: razhan/DOLMA-speech hawrami
19
+ type: razhan/DOLMA-speech
20
+ args: hawrami
21
+ metrics:
22
+ - name: Wer
23
+ type: wer
24
+ value: 0.47917770477906113
25
  ---
26
 
27
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
29
 
30
  # whisper-base-hac
31
 
32
+ This model is a fine-tuned version of [openai/whisper-base](https://huggingface.co/openai/whisper-base) on the razhan/DOLMA-speech hawrami dataset.
33
  It achieves the following results on the evaluation set:
34
  - Loss: 0.3272
35
  - Wer: 0.4792
all_results.json CHANGED
@@ -1,17 +1,16 @@
1
  {
2
- "epoch": 4.0,
3
- "eval_cer": 0.26081384171739824,
4
- "eval_loss": 0.8250513076782227,
5
- "eval_model_preparation_time": 0.0031,
6
- "eval_runtime": 88.7908,
7
  "eval_samples": 1263,
8
- "eval_samples_per_second": 14.224,
9
- "eval_steps_per_second": 0.056,
10
- "eval_wer": 0.9221150789445799,
11
- "total_flos": 1.261916109448151e+18,
12
- "train_loss": 2.151222774856969,
13
- "train_runtime": 1211.2403,
14
- "train_samples": 4773,
15
- "train_samples_per_second": 15.762,
16
- "train_steps_per_second": 0.063
17
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "eval_cer": 0.10385057579584221,
4
+ "eval_loss": 0.32716336846351624,
5
+ "eval_runtime": 86.6976,
 
6
  "eval_samples": 1263,
7
+ "eval_samples_per_second": 14.568,
8
+ "eval_steps_per_second": 0.058,
9
+ "eval_wer": 0.47917770477906113,
10
+ "total_flos": 3.3623422081150484e+18,
11
+ "train_loss": 0.8413535683243363,
12
+ "train_runtime": 3448.7065,
13
+ "train_samples": 10165,
14
+ "train_samples_per_second": 14.737,
15
+ "train_steps_per_second": 0.039
16
  }
eval_results.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "eval_cer": 0.26081384171739824,
3
- "eval_loss": 0.8250513076782227,
4
- "eval_model_preparation_time": 0.0031,
5
- "eval_runtime": 88.7908,
6
  "eval_samples": 1263,
7
- "eval_samples_per_second": 14.224,
8
- "eval_steps_per_second": 0.056,
9
- "eval_wer": 0.9221150789445799
10
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "eval_cer": 0.10385057579584221,
4
+ "eval_loss": 0.32716336846351624,
5
+ "eval_runtime": 86.6976,
6
  "eval_samples": 1263,
7
+ "eval_samples_per_second": 14.568,
8
+ "eval_steps_per_second": 0.058,
9
+ "eval_wer": 0.47917770477906113
10
  }
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 4.0,
3
- "total_flos": 1.261916109448151e+18,
4
- "train_loss": 2.151222774856969,
5
- "train_runtime": 1211.2403,
6
- "train_samples": 4773,
7
- "train_samples_per_second": 15.762,
8
- "train_steps_per_second": 0.063
9
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "total_flos": 3.3623422081150484e+18,
4
+ "train_loss": 0.8413535683243363,
5
+ "train_runtime": 3448.7065,
6
+ "train_samples": 10165,
7
+ "train_samples_per_second": 14.737,
8
+ "train_steps_per_second": 0.039
9
  }
trainer_state.json CHANGED
@@ -1,116 +1,168 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 4.0,
5
  "eval_steps": 500,
6
- "global_step": 76,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.5263157894736842,
13
- "grad_norm": 64.39277648925781,
14
- "learning_rate": 4.0000000000000003e-07,
15
- "loss": 3.6464,
16
  "step": 10
17
  },
18
  {
19
- "epoch": 1.0,
20
- "eval_cer": 0.45834372661511597,
21
- "eval_loss": 3.158611297607422,
22
- "eval_runtime": 19.3102,
23
- "eval_samples_per_second": 10.564,
24
- "eval_steps_per_second": 0.052,
25
- "eval_wer": 0.9852579852579852,
26
- "step": 19
27
- },
28
- {
29
- "epoch": 1.0526315789473684,
30
- "grad_norm": 47.9715576171875,
31
- "learning_rate": 1.4000000000000001e-06,
32
- "loss": 3.405,
33
  "step": 20
34
  },
35
  {
36
- "epoch": 1.5789473684210527,
37
- "grad_norm": 30.349884033203125,
38
- "learning_rate": 2.4000000000000003e-06,
39
- "loss": 2.797,
40
- "step": 30
 
 
 
41
  },
42
  {
43
- "epoch": 2.0,
44
- "eval_cer": 0.4428785233225243,
45
- "eval_loss": 2.0119194984436035,
46
- "eval_runtime": 18.2983,
47
- "eval_samples_per_second": 11.149,
48
- "eval_steps_per_second": 0.055,
49
- "eval_wer": 0.9963144963144963,
50
- "step": 38
51
  },
52
  {
53
- "epoch": 2.1052631578947367,
54
- "grad_norm": 24.85350227355957,
55
- "learning_rate": 3.4000000000000005e-06,
56
- "loss": 2.1901,
57
  "step": 40
58
  },
59
  {
60
- "epoch": 2.6315789473684212,
61
- "grad_norm": 15.238232612609863,
62
- "learning_rate": 4.4e-06,
63
- "loss": 1.6366,
64
  "step": 50
65
  },
66
  {
67
- "epoch": 3.0,
68
- "eval_cer": 0.3800199551010227,
69
- "eval_loss": 1.2072163820266724,
70
- "eval_runtime": 17.6074,
71
- "eval_samples_per_second": 11.586,
72
  "eval_steps_per_second": 0.057,
73
- "eval_wer": 0.992014742014742,
74
- "step": 57
75
  },
76
  {
77
- "epoch": 3.1578947368421053,
78
- "grad_norm": 8.841925621032715,
79
- "learning_rate": 5.400000000000001e-06,
80
- "loss": 1.2455,
81
  "step": 60
82
  },
83
  {
84
- "epoch": 3.6842105263157894,
85
- "grad_norm": 4.40842342376709,
86
- "learning_rate": 6.4000000000000006e-06,
87
- "loss": 0.9577,
88
  "step": 70
89
  },
90
  {
91
- "epoch": 4.0,
92
- "eval_cer": 0.24893988525816912,
93
- "eval_loss": 0.7948786020278931,
94
- "eval_runtime": 16.9884,
95
- "eval_samples_per_second": 12.008,
96
- "eval_steps_per_second": 0.059,
97
- "eval_wer": 0.8052825552825553,
98
- "step": 76
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
99
  },
100
  {
101
  "epoch": 4.0,
102
- "step": 76,
103
- "total_flos": 1.261916109448151e+18,
104
- "train_loss": 2.151222774856969,
105
- "train_runtime": 1211.2403,
106
- "train_samples_per_second": 15.762,
107
- "train_steps_per_second": 0.063
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
108
  }
109
  ],
110
  "logging_steps": 10,
111
- "max_steps": 76,
112
  "num_input_tokens_seen": 0,
113
- "num_train_epochs": 4,
114
  "save_steps": 500,
115
  "stateful_callbacks": {
116
  "TrainerControl": {
@@ -124,8 +176,8 @@
124
  "attributes": {}
125
  }
126
  },
127
- "total_flos": 1.261916109448151e+18,
128
- "train_batch_size": 128,
129
  "trial_name": null,
130
  "trial_params": null
131
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 5.0,
5
  "eval_steps": 500,
6
+ "global_step": 135,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.37037037037037035,
13
+ "grad_norm": 34.00384521484375,
14
+ "learning_rate": 9.776119402985076e-06,
15
+ "loss": 3.5666,
16
  "step": 10
17
  },
18
  {
19
+ "epoch": 0.7407407407407407,
20
+ "grad_norm": 14.095426559448242,
21
+ "learning_rate": 9.029850746268657e-06,
22
+ "loss": 1.9468,
 
 
 
 
 
 
 
 
 
 
23
  "step": 20
24
  },
25
  {
26
+ "epoch": 1.0,
27
+ "eval_cer": 0.3796859980775393,
28
+ "eval_loss": 0.9999122619628906,
29
+ "eval_runtime": 91.0467,
30
+ "eval_samples_per_second": 13.872,
31
+ "eval_steps_per_second": 0.055,
32
+ "eval_wer": 0.9633358058705097,
33
+ "step": 27
34
  },
35
  {
36
+ "epoch": 1.1111111111111112,
37
+ "grad_norm": 6.282424449920654,
38
+ "learning_rate": 8.283582089552239e-06,
39
+ "loss": 1.1917,
40
+ "step": 30
 
 
 
41
  },
42
  {
43
+ "epoch": 1.4814814814814814,
44
+ "grad_norm": 4.256287574768066,
45
+ "learning_rate": 7.537313432835821e-06,
46
+ "loss": 0.8244,
47
  "step": 40
48
  },
49
  {
50
+ "epoch": 1.8518518518518519,
51
+ "grad_norm": 2.4645814895629883,
52
+ "learning_rate": 6.791044776119403e-06,
53
+ "loss": 0.6132,
54
  "step": 50
55
  },
56
  {
57
+ "epoch": 2.0,
58
+ "eval_cer": 0.1469174661213412,
59
+ "eval_loss": 0.468128502368927,
60
+ "eval_runtime": 87.6022,
61
+ "eval_samples_per_second": 14.417,
62
  "eval_steps_per_second": 0.057,
63
+ "eval_wer": 0.6078202818692381,
64
+ "step": 54
65
  },
66
  {
67
+ "epoch": 2.2222222222222223,
68
+ "grad_norm": 2.1577141284942627,
69
+ "learning_rate": 6.044776119402986e-06,
70
+ "loss": 0.4936,
71
  "step": 60
72
  },
73
  {
74
+ "epoch": 2.5925925925925926,
75
+ "grad_norm": 2.0963618755340576,
76
+ "learning_rate": 5.298507462686567e-06,
77
+ "loss": 0.4327,
78
  "step": 70
79
  },
80
  {
81
+ "epoch": 2.962962962962963,
82
+ "grad_norm": 1.5172204971313477,
83
+ "learning_rate": 4.5522388059701495e-06,
84
+ "loss": 0.3976,
85
+ "step": 80
86
+ },
87
+ {
88
+ "epoch": 3.0,
89
+ "eval_cer": 0.11282205929472078,
90
+ "eval_loss": 0.366842657327652,
91
+ "eval_runtime": 86.2276,
92
+ "eval_samples_per_second": 14.647,
93
+ "eval_steps_per_second": 0.058,
94
+ "eval_wer": 0.5160538306665253,
95
+ "step": 81
96
+ },
97
+ {
98
+ "epoch": 3.3333333333333335,
99
+ "grad_norm": 1.841143012046814,
100
+ "learning_rate": 3.8059701492537314e-06,
101
+ "loss": 0.3747,
102
+ "step": 90
103
+ },
104
+ {
105
+ "epoch": 3.7037037037037037,
106
+ "grad_norm": 1.7737436294555664,
107
+ "learning_rate": 3.0597014925373137e-06,
108
+ "loss": 0.3485,
109
+ "step": 100
110
  },
111
  {
112
  "epoch": 4.0,
113
+ "eval_cer": 0.10645155210434061,
114
+ "eval_loss": 0.33595842123031616,
115
+ "eval_runtime": 86.4694,
116
+ "eval_samples_per_second": 14.606,
117
+ "eval_steps_per_second": 0.058,
118
+ "eval_wer": 0.488926565645862,
119
+ "step": 108
120
+ },
121
+ {
122
+ "epoch": 4.074074074074074,
123
+ "grad_norm": 1.6087193489074707,
124
+ "learning_rate": 2.3134328358208956e-06,
125
+ "loss": 0.3447,
126
+ "step": 110
127
+ },
128
+ {
129
+ "epoch": 4.444444444444445,
130
+ "grad_norm": 1.753946304321289,
131
+ "learning_rate": 1.5671641791044779e-06,
132
+ "loss": 0.338,
133
+ "step": 120
134
+ },
135
+ {
136
+ "epoch": 4.814814814814815,
137
+ "grad_norm": 1.5161445140838623,
138
+ "learning_rate": 8.208955223880598e-07,
139
+ "loss": 0.3292,
140
+ "step": 130
141
+ },
142
+ {
143
+ "epoch": 5.0,
144
+ "eval_cer": 0.10385057579584221,
145
+ "eval_loss": 0.32716336846351624,
146
+ "eval_runtime": 85.8417,
147
+ "eval_samples_per_second": 14.713,
148
+ "eval_steps_per_second": 0.058,
149
+ "eval_wer": 0.47917770477906113,
150
+ "step": 135
151
+ },
152
+ {
153
+ "epoch": 5.0,
154
+ "step": 135,
155
+ "total_flos": 3.3623422081150484e+18,
156
+ "train_loss": 0.8413535683243363,
157
+ "train_runtime": 3448.7065,
158
+ "train_samples_per_second": 14.737,
159
+ "train_steps_per_second": 0.039
160
  }
161
  ],
162
  "logging_steps": 10,
163
+ "max_steps": 135,
164
  "num_input_tokens_seen": 0,
165
+ "num_train_epochs": 5,
166
  "save_steps": 500,
167
  "stateful_callbacks": {
168
  "TrainerControl": {
 
176
  "attributes": {}
177
  }
178
  },
179
+ "total_flos": 3.3623422081150484e+18,
180
+ "train_batch_size": 192,
181
  "trial_name": null,
182
  "trial_params": null
183
  }