bkh6722 committed on
Commit
1c4de63
·
1 Parent(s): 331d19d

End of training

Browse files
runs/{May17_00-20-06_0d0f38c34c7b → wav2vec-d}/1652746815.4360282/events.out.tfevents.1652746815.0d0f38c34c7b.743.1 RENAMED
File without changes
runs/{May17_00-20-06_0d0f38c34c7b → wav2vec-d}/events.out.tfevents.1652746815.0d0f38c34c7b.743.0 RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbdc4322691edf20dae43110e0295655b5d7397bd56dcfec84d1203fdca86545
3
- size 11726
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bfe15d427df26c4987d1235f850532e91beb18f1889de02613287a142ece85d
3
+ size 12080
wav2vec-d/config.json ADDED
@@ -0,0 +1,80 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "facebook/wav2vec2-base-960h",
3
+ "activation_dropout": 0.1,
4
+ "apply_spec_augment": true,
5
+ "architectures": [
6
+ "Wav2Vec2ForCTC"
7
+ ],
8
+ "attention_dropout": 0.5,
9
+ "bos_token_id": 1,
10
+ "classifier_proj_size": 256,
11
+ "codevector_dim": 256,
12
+ "contrastive_logits_temperature": 0.1,
13
+ "conv_bias": false,
14
+ "conv_dim": [
15
+ 512,
16
+ 512,
17
+ 512,
18
+ 512,
19
+ 512,
20
+ 512,
21
+ 512
22
+ ],
23
+ "conv_kernel": [
24
+ 10,
25
+ 3,
26
+ 3,
27
+ 3,
28
+ 3,
29
+ 2,
30
+ 2
31
+ ],
32
+ "conv_stride": [
33
+ 5,
34
+ 2,
35
+ 2,
36
+ 2,
37
+ 2,
38
+ 2,
39
+ 2
40
+ ],
41
+ "ctc_loss_reduction": "mean",
42
+ "ctc_zero_infinity": false,
43
+ "diversity_loss_weight": 0.1,
44
+ "do_stable_layer_norm": false,
45
+ "eos_token_id": 2,
46
+ "feat_extract_activation": "gelu",
47
+ "feat_extract_dropout": 0.0,
48
+ "feat_extract_norm": "group",
49
+ "feat_proj_dropout": 0.0,
50
+ "feat_quantizer_dropout": 0.0,
51
+ "final_dropout": 0.1,
52
+ "gradient_checkpointing": false,
53
+ "hidden_act": "gelu",
54
+ "hidden_dropout": 0.0,
55
+ "hidden_dropout_prob": 0.1,
56
+ "hidden_size": 768,
57
+ "initializer_range": 0.02,
58
+ "intermediate_size": 3072,
59
+ "layer_norm_eps": 1e-05,
60
+ "layerdrop": 0.0,
61
+ "mask_feature_length": 10,
62
+ "mask_feature_prob": 0.0,
63
+ "mask_time_length": 10,
64
+ "mask_time_prob": 0.05,
65
+ "model_type": "wav2vec2",
66
+ "num_attention_heads": 12,
67
+ "num_codevector_groups": 2,
68
+ "num_codevectors_per_group": 320,
69
+ "num_conv_pos_embedding_groups": 16,
70
+ "num_conv_pos_embeddings": 128,
71
+ "num_feat_extract_layers": 7,
72
+ "num_hidden_layers": 12,
73
+ "num_negatives": 100,
74
+ "pad_token_id": 24,
75
+ "proj_codevector_dim": 256,
76
+ "torch_dtype": "float32",
77
+ "transformers_version": "4.11.3",
78
+ "use_weighted_layer_sum": false,
79
+ "vocab_size": 32
80
+ }
wav2vec-d/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44eba4955ea0de84ec6524d0a1ac2e5bab02f0b5f6db93700f8bd0c75be0d85b
3
+ size 721685265
wav2vec-d/preprocessor_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
+ "feature_size": 1,
5
+ "padding_side": "right",
6
+ "padding_value": 0.0,
7
+ "return_attention_mask": true,
8
+ "sampling_rate": 16000
9
+ }
wav2vec-d/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af2867f74cc5fb8521e8001af14d411e5fcf0f238969256724df83dec44cadbc
3
+ size 377670039
wav2vec-d/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1052e6c582a4388b54ace3638a4762af4511b2382928530d9fc1fab6ffbd910
3
+ size 14567
runs/May17_00-14-36_0d0f38c34c7b/1652746709.7643979/events.out.tfevents.1652746709.0d0f38c34c7b.73.1 → wav2vec-d/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:051b85de044e2277947d70e3b88236854ed38fba011732f65a6ce54f7cb2a8f6
3
- size 4483
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:091b66edd1d5eeac221d1f228e19c194bd6930ca53057e50163f132aef445527
3
+ size 559
runs/May17_00-14-36_0d0f38c34c7b/events.out.tfevents.1652746709.0d0f38c34c7b.73.0 → wav2vec-d/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21e4ba400b95879885bc97f72f11d36d86eada899ba3e90f97695a6ae43584c5
3
- size 4135
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab0e6a5bfa499dc0025c224e8227d915eec5c98624986fcfb52c2e05eb1aa32e
3
+ size 623
wav2vec-d/trainer_state.json ADDED
@@ -0,0 +1,256 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 799.8,
5
+ "global_step": 1600,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 49.8,
12
+ "learning_rate": 5.5799999999999994e-05,
13
+ "loss": 42.4143,
14
+ "step": 100
15
+ },
16
+ {
17
+ "epoch": 49.8,
18
+ "eval_loss": 21.511550903320312,
19
+ "eval_runtime": 22.3742,
20
+ "eval_samples_per_second": 2.413,
21
+ "eval_steps_per_second": 0.313,
22
+ "eval_wer": 1.0,
23
+ "step": 100
24
+ },
25
+ {
26
+ "epoch": 99.8,
27
+ "learning_rate": 0.0001158,
28
+ "loss": 5.9884,
29
+ "step": 200
30
+ },
31
+ {
32
+ "epoch": 99.8,
33
+ "eval_loss": 31.79755401611328,
34
+ "eval_runtime": 0.9499,
35
+ "eval_samples_per_second": 56.846,
36
+ "eval_steps_per_second": 7.369,
37
+ "eval_wer": 1.0,
38
+ "step": 200
39
+ },
40
+ {
41
+ "epoch": 149.8,
42
+ "learning_rate": 0.00017579999999999996,
43
+ "loss": 4.0043,
44
+ "step": 300
45
+ },
46
+ {
47
+ "epoch": 149.8,
48
+ "eval_loss": 3.482863187789917,
49
+ "eval_runtime": 0.9439,
50
+ "eval_samples_per_second": 57.208,
51
+ "eval_steps_per_second": 7.416,
52
+ "eval_wer": 1.0,
53
+ "step": 300
54
+ },
55
+ {
56
+ "epoch": 199.8,
57
+ "learning_rate": 0.00023579999999999999,
58
+ "loss": 3.653,
59
+ "step": 400
60
+ },
61
+ {
62
+ "epoch": 199.8,
63
+ "eval_loss": 3.6417062282562256,
64
+ "eval_runtime": 0.9393,
65
+ "eval_samples_per_second": 57.489,
66
+ "eval_steps_per_second": 7.452,
67
+ "eval_wer": 1.0,
68
+ "step": 400
69
+ },
70
+ {
71
+ "epoch": 249.8,
72
+ "learning_rate": 0.0002958,
73
+ "loss": 3.5207,
74
+ "step": 500
75
+ },
76
+ {
77
+ "epoch": 249.8,
78
+ "eval_loss": 3.508103370666504,
79
+ "eval_runtime": 0.9443,
80
+ "eval_samples_per_second": 57.187,
81
+ "eval_steps_per_second": 7.413,
82
+ "eval_wer": 1.0,
83
+ "step": 500
84
+ },
85
+ {
86
+ "epoch": 299.8,
87
+ "learning_rate": 0.0002746363636363636,
88
+ "loss": 3.63,
89
+ "step": 600
90
+ },
91
+ {
92
+ "epoch": 299.8,
93
+ "eval_loss": 3.4835526943206787,
94
+ "eval_runtime": 0.943,
95
+ "eval_samples_per_second": 57.264,
96
+ "eval_steps_per_second": 7.423,
97
+ "eval_wer": 1.0,
98
+ "step": 600
99
+ },
100
+ {
101
+ "epoch": 349.8,
102
+ "learning_rate": 0.00024736363636363633,
103
+ "loss": 3.648,
104
+ "step": 700
105
+ },
106
+ {
107
+ "epoch": 349.8,
108
+ "eval_loss": 3.4515135288238525,
109
+ "eval_runtime": 0.9803,
110
+ "eval_samples_per_second": 55.084,
111
+ "eval_steps_per_second": 7.141,
112
+ "eval_wer": 1.0,
113
+ "step": 700
114
+ },
115
+ {
116
+ "epoch": 399.8,
117
+ "learning_rate": 0.00022009090909090907,
118
+ "loss": 3.6448,
119
+ "step": 800
120
+ },
121
+ {
122
+ "epoch": 399.8,
123
+ "eval_loss": 3.4646780490875244,
124
+ "eval_runtime": 0.9384,
125
+ "eval_samples_per_second": 57.547,
126
+ "eval_steps_per_second": 7.46,
127
+ "eval_wer": 1.0,
128
+ "step": 800
129
+ },
130
+ {
131
+ "epoch": 449.8,
132
+ "learning_rate": 0.0001928181818181818,
133
+ "loss": 3.6872,
134
+ "step": 900
135
+ },
136
+ {
137
+ "epoch": 449.8,
138
+ "eval_loss": 3.4371423721313477,
139
+ "eval_runtime": 0.938,
140
+ "eval_samples_per_second": 57.568,
141
+ "eval_steps_per_second": 7.463,
142
+ "eval_wer": 1.0,
143
+ "step": 900
144
+ },
145
+ {
146
+ "epoch": 499.8,
147
+ "learning_rate": 0.0001655454545454545,
148
+ "loss": 3.6892,
149
+ "step": 1000
150
+ },
151
+ {
152
+ "epoch": 499.8,
153
+ "eval_loss": 3.4336819648742676,
154
+ "eval_runtime": 0.9476,
155
+ "eval_samples_per_second": 56.988,
156
+ "eval_steps_per_second": 7.387,
157
+ "eval_wer": 1.0,
158
+ "step": 1000
159
+ },
160
+ {
161
+ "epoch": 549.8,
162
+ "learning_rate": 0.00013827272727272728,
163
+ "loss": 3.684,
164
+ "step": 1100
165
+ },
166
+ {
167
+ "epoch": 549.8,
168
+ "eval_loss": 3.437472343444824,
169
+ "eval_runtime": 0.94,
170
+ "eval_samples_per_second": 57.449,
171
+ "eval_steps_per_second": 7.447,
172
+ "eval_wer": 1.0,
173
+ "step": 1100
174
+ },
175
+ {
176
+ "epoch": 599.8,
177
+ "learning_rate": 0.00011099999999999999,
178
+ "loss": 3.6843,
179
+ "step": 1200
180
+ },
181
+ {
182
+ "epoch": 599.8,
183
+ "eval_loss": 3.4452097415924072,
184
+ "eval_runtime": 0.9463,
185
+ "eval_samples_per_second": 57.067,
186
+ "eval_steps_per_second": 7.398,
187
+ "eval_wer": 1.0,
188
+ "step": 1200
189
+ },
190
+ {
191
+ "epoch": 649.8,
192
+ "learning_rate": 8.372727272727272e-05,
193
+ "loss": 3.6842,
194
+ "step": 1300
195
+ },
196
+ {
197
+ "epoch": 649.8,
198
+ "eval_loss": 3.441551446914673,
199
+ "eval_runtime": 0.9462,
200
+ "eval_samples_per_second": 57.068,
201
+ "eval_steps_per_second": 7.398,
202
+ "eval_wer": 1.0,
203
+ "step": 1300
204
+ },
205
+ {
206
+ "epoch": 699.8,
207
+ "learning_rate": 5.645454545454545e-05,
208
+ "loss": 3.6819,
209
+ "step": 1400
210
+ },
211
+ {
212
+ "epoch": 699.8,
213
+ "eval_loss": 3.4498231410980225,
214
+ "eval_runtime": 0.9402,
215
+ "eval_samples_per_second": 57.435,
216
+ "eval_steps_per_second": 7.445,
217
+ "eval_wer": 1.0,
218
+ "step": 1400
219
+ },
220
+ {
221
+ "epoch": 749.8,
222
+ "learning_rate": 2.918181818181818e-05,
223
+ "loss": 3.6832,
224
+ "step": 1500
225
+ },
226
+ {
227
+ "epoch": 749.8,
228
+ "eval_loss": 3.4524271488189697,
229
+ "eval_runtime": 0.9511,
230
+ "eval_samples_per_second": 56.778,
231
+ "eval_steps_per_second": 7.36,
232
+ "eval_wer": 1.0,
233
+ "step": 1500
234
+ },
235
+ {
236
+ "epoch": 799.8,
237
+ "learning_rate": 1.909090909090909e-06,
238
+ "loss": 3.6828,
239
+ "step": 1600
240
+ },
241
+ {
242
+ "epoch": 799.8,
243
+ "eval_loss": 3.4495346546173096,
244
+ "eval_runtime": 0.9541,
245
+ "eval_samples_per_second": 56.598,
246
+ "eval_steps_per_second": 7.337,
247
+ "eval_wer": 1.0,
248
+ "step": 1600
249
+ }
250
+ ],
251
+ "max_steps": 1600,
252
+ "num_train_epochs": 800,
253
+ "total_flos": 1.8719390163492864e+18,
254
+ "trial_name": null,
255
+ "trial_params": null
256
+ }
wav2vec-d/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19f0c582e5da6613da0735544fb140f0f7217fc13b5e3427db24f1d7c8b22440
3
+ size 2799