JaratX commited on
Commit
4ec0bf9
·
1 Parent(s): e0cf9f1

Delete transcription/w2v-bert-darija-finetuned-clean/checkpoint-1490

Browse files
transcription/w2v-bert-darija-finetuned-clean/checkpoint-1490/config.json DELETED
@@ -1,82 +0,0 @@
1
- {
2
- "_name_or_path": "facebook/w2v-bert-2.0",
3
- "activation_dropout": 0.0,
4
- "adapter_act": "relu",
5
- "adapter_kernel_size": 3,
6
- "adapter_stride": 2,
7
- "add_adapter": true,
8
- "apply_spec_augment": false,
9
- "architectures": [
10
- "Wav2Vec2BertForCTC"
11
- ],
12
- "attention_dropout": 0.0,
13
- "bos_token_id": 1,
14
- "classifier_proj_size": 768,
15
- "codevector_dim": 768,
16
- "conformer_conv_dropout": 0.1,
17
- "contrastive_logits_temperature": 0.1,
18
- "conv_depthwise_kernel_size": 31,
19
- "ctc_loss_reduction": "mean",
20
- "ctc_zero_infinity": false,
21
- "diversity_loss_weight": 0.1,
22
- "eos_token_id": 2,
23
- "feat_proj_dropout": 0.0,
24
- "feat_quantizer_dropout": 0.0,
25
- "feature_projection_input_dim": 160,
26
- "final_dropout": 0.1,
27
- "hidden_act": "swish",
28
- "hidden_dropout": 0.0,
29
- "hidden_size": 1024,
30
- "initializer_range": 0.02,
31
- "intermediate_size": 4096,
32
- "layer_norm_eps": 1e-05,
33
- "layerdrop": 0.0,
34
- "left_max_position_embeddings": 64,
35
- "mask_feature_length": 10,
36
- "mask_feature_min_masks": 0,
37
- "mask_feature_prob": 0.0,
38
- "mask_time_length": 10,
39
- "mask_time_min_masks": 2,
40
- "mask_time_prob": 0.0,
41
- "max_source_positions": 5000,
42
- "model_type": "wav2vec2-bert",
43
- "num_adapter_layers": 1,
44
- "num_attention_heads": 16,
45
- "num_codevector_groups": 2,
46
- "num_codevectors_per_group": 320,
47
- "num_hidden_layers": 24,
48
- "num_negatives": 100,
49
- "output_hidden_size": 1024,
50
- "pad_token_id": 55,
51
- "position_embeddings_type": "relative_key",
52
- "proj_codevector_dim": 768,
53
- "right_max_position_embeddings": 8,
54
- "rotary_embedding_base": 10000,
55
- "tdnn_dilation": [
56
- 1,
57
- 2,
58
- 3,
59
- 1,
60
- 1
61
- ],
62
- "tdnn_dim": [
63
- 512,
64
- 512,
65
- 512,
66
- 512,
67
- 1500
68
- ],
69
- "tdnn_kernel": [
70
- 5,
71
- 3,
72
- 3,
73
- 1,
74
- 1
75
- ],
76
- "torch_dtype": "float32",
77
- "transformers_version": "4.46.3",
78
- "use_intermediate_ffn_before_adapter": false,
79
- "use_weighted_layer_sum": false,
80
- "vocab_size": 58,
81
- "xvector_output_dim": 512
82
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
transcription/w2v-bert-darija-finetuned-clean/checkpoint-1490/preprocessor_config.json DELETED
@@ -1,10 +0,0 @@
1
- {
2
- "feature_extractor_type": "SeamlessM4TFeatureExtractor",
3
- "feature_size": 80,
4
- "num_mel_bins": 80,
5
- "padding_side": "right",
6
- "padding_value": 0.0,
7
- "return_attention_mask": true,
8
- "sampling_rate": 16000,
9
- "stride": 2
10
- }
 
 
 
 
 
 
 
 
 
 
 
transcription/w2v-bert-darija-finetuned-clean/checkpoint-1490/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2a812a278c72cb787298245f122ab589285b867cb9fb13812819e443341549a
3
- size 14244
 
 
 
 
transcription/w2v-bert-darija-finetuned-clean/checkpoint-1490/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a83b4666c22523603f0a60b34d13d8692110ae1c6107f863de3447d27acb008b
3
- size 1064
 
 
 
 
transcription/w2v-bert-darija-finetuned-clean/checkpoint-1490/trainer_state.json DELETED
@@ -1,220 +0,0 @@
1
- {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 10.99630996309963,
5
- "eval_steps": 500,
6
- "global_step": 1490,
7
- "is_hyper_param_search": false,
8
- "is_local_process_zero": true,
9
- "is_world_process_zero": true,
10
- "log_history": [
11
- {
12
- "epoch": 0.996309963099631,
13
- "grad_norm": 6.060778617858887,
14
- "learning_rate": 1.3100000000000002e-05,
15
- "loss": 4.0745,
16
- "step": 135
17
- },
18
- {
19
- "epoch": 0.996309963099631,
20
- "eval_loss": 2.8919060230255127,
21
- "eval_pen_wer": 0.9288469971028115,
22
- "eval_runtime": 35.4574,
23
- "eval_samples_per_second": 7.643,
24
- "eval_steps_per_second": 0.959,
25
- "eval_wer": 0.9983822042467139,
26
- "step": 135
27
- },
28
- {
29
- "epoch": 2.0,
30
- "grad_norm": 32.26631164550781,
31
- "learning_rate": 2.6700000000000002e-05,
32
- "loss": 1.9077,
33
- "step": 271
34
- },
35
- {
36
- "epoch": 2.0,
37
- "eval_loss": 1.279911756515503,
38
- "eval_pen_wer": 0.4244393978114909,
39
- "eval_runtime": 36.3495,
40
- "eval_samples_per_second": 7.455,
41
- "eval_steps_per_second": 0.935,
42
- "eval_wer": 0.6604651162790698,
43
- "step": 271
44
- },
45
- {
46
- "epoch": 2.9963099630996313,
47
- "grad_norm": 5.846123218536377,
48
- "learning_rate": 4.02e-05,
49
- "loss": 1.2007,
50
- "step": 406
51
- },
52
- {
53
- "epoch": 2.9963099630996313,
54
- "eval_loss": 1.1114612817764282,
55
- "eval_pen_wer": 0.36216589798996246,
56
- "eval_runtime": 36.7217,
57
- "eval_samples_per_second": 7.38,
58
- "eval_steps_per_second": 0.926,
59
- "eval_wer": 0.5937984496124031,
60
- "step": 406
61
- },
62
- {
63
- "epoch": 4.0,
64
- "grad_norm": 7.9398193359375,
65
- "learning_rate": 4.8303571428571434e-05,
66
- "loss": 1.0249,
67
- "step": 542
68
- },
69
- {
70
- "epoch": 4.0,
71
- "eval_loss": 1.0737940073013306,
72
- "eval_pen_wer": 0.34027092257628144,
73
- "eval_runtime": 36.6597,
74
- "eval_samples_per_second": 7.392,
75
- "eval_steps_per_second": 0.927,
76
- "eval_wer": 0.5542298618132794,
77
- "step": 542
78
- },
79
- {
80
- "epoch": 4.996309963099631,
81
- "grad_norm": 5.927522659301758,
82
- "learning_rate": 4.2276785714285714e-05,
83
- "loss": 0.8813,
84
- "step": 677
85
- },
86
- {
87
- "epoch": 4.996309963099631,
88
- "eval_loss": 1.0277714729309082,
89
- "eval_pen_wer": 0.34514653099587383,
90
- "eval_runtime": 36.4973,
91
- "eval_samples_per_second": 7.425,
92
- "eval_steps_per_second": 0.932,
93
- "eval_wer": 0.5530165149983148,
94
- "step": 677
95
- },
96
- {
97
- "epoch": 6.0,
98
- "grad_norm": 11.025650978088379,
99
- "learning_rate": 3.620535714285714e-05,
100
- "loss": 0.7769,
101
- "step": 813
102
- },
103
- {
104
- "epoch": 6.0,
105
- "eval_loss": 0.9775798320770264,
106
- "eval_pen_wer": 0.32710190850231297,
107
- "eval_runtime": 36.7174,
108
- "eval_samples_per_second": 7.381,
109
- "eval_steps_per_second": 0.926,
110
- "eval_wer": 0.5332659251769464,
111
- "step": 813
112
- },
113
- {
114
- "epoch": 6.996309963099631,
115
- "grad_norm": 6.112392425537109,
116
- "learning_rate": 3.0178571428571427e-05,
117
- "loss": 0.7,
118
- "step": 948
119
- },
120
- {
121
- "epoch": 6.996309963099631,
122
- "eval_loss": 0.9915932416915894,
123
- "eval_pen_wer": 0.3124926266483397,
124
- "eval_runtime": 36.3976,
125
- "eval_samples_per_second": 7.446,
126
- "eval_steps_per_second": 0.934,
127
- "eval_wer": 0.5078530502190766,
128
- "step": 948
129
- },
130
- {
131
- "epoch": 8.0,
132
- "grad_norm": 17.379560470581055,
133
- "learning_rate": 2.4107142857142858e-05,
134
- "loss": 0.6065,
135
- "step": 1084
136
- },
137
- {
138
- "epoch": 8.0,
139
- "eval_loss": 0.992123544216156,
140
- "eval_pen_wer": 0.31970698851386425,
141
- "eval_runtime": 36.1353,
142
- "eval_samples_per_second": 7.5,
143
- "eval_steps_per_second": 0.941,
144
- "eval_wer": 0.5029322548028311,
145
- "step": 1084
146
- },
147
- {
148
- "epoch": 8.99630996309963,
149
- "grad_norm": 7.368852615356445,
150
- "learning_rate": 1.8080357142857144e-05,
151
- "loss": 0.5375,
152
- "step": 1219
153
- },
154
- {
155
- "epoch": 8.99630996309963,
156
- "eval_loss": 0.984150230884552,
157
- "eval_pen_wer": 0.302135588075932,
158
- "eval_runtime": 36.9038,
159
- "eval_samples_per_second": 7.343,
160
- "eval_steps_per_second": 0.921,
161
- "eval_wer": 0.4912032355915066,
162
- "step": 1219
163
- },
164
- {
165
- "epoch": 10.0,
166
- "grad_norm": 9.9882230758667,
167
- "learning_rate": 1.2008928571428573e-05,
168
- "loss": 0.4681,
169
- "step": 1355
170
- },
171
- {
172
- "epoch": 10.0,
173
- "eval_loss": 1.0245816707611084,
174
- "eval_pen_wer": 0.3019771813401745,
175
- "eval_runtime": 36.9691,
176
- "eval_samples_per_second": 7.33,
177
- "eval_steps_per_second": 0.92,
178
- "eval_wer": 0.4895180316818335,
179
- "step": 1355
180
- },
181
- {
182
- "epoch": 10.99630996309963,
183
- "grad_norm": 5.356689453125,
184
- "learning_rate": 5.982142857142858e-06,
185
- "loss": 0.415,
186
- "step": 1490
187
- },
188
- {
189
- "epoch": 10.99630996309963,
190
- "eval_loss": 1.0347157716751099,
191
- "eval_pen_wer": 0.29928239999524137,
192
- "eval_runtime": 36.6987,
193
- "eval_samples_per_second": 7.384,
194
- "eval_steps_per_second": 0.926,
195
- "eval_wer": 0.48230535894843274,
196
- "step": 1490
197
- }
198
- ],
199
- "logging_steps": 500,
200
- "max_steps": 1620,
201
- "num_input_tokens_seen": 0,
202
- "num_train_epochs": 12,
203
- "save_steps": 500,
204
- "stateful_callbacks": {
205
- "TrainerControl": {
206
- "args": {
207
- "should_epoch_stop": false,
208
- "should_evaluate": false,
209
- "should_log": false,
210
- "should_save": true,
211
- "should_training_stop": false
212
- },
213
- "attributes": {}
214
- }
215
- },
216
- "total_flos": 8.432449882085846e+18,
217
- "train_batch_size": 4,
218
- "trial_name": null,
219
- "trial_params": null
220
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
transcription/w2v-bert-darija-finetuned-clean/checkpoint-1490/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2793aaf5af1a42cb015bfef656c097f2acac87a48fffa9d3175eaeceb802e54
3
- size 5304