IonGrozea committed on
Commit
cc307a3
·
verified ·
1 Parent(s): 17fb248

Restructure: Move files from final_best to root and delete subfolder

Browse files
final_best/added_tokens.json → added_tokens.json RENAMED
File without changes
final_best/config.json DELETED
@@ -1,60 +0,0 @@
1
- {
2
- "activation_dropout": 0.0,
3
- "activation_function": "gelu",
4
- "apply_spec_augment": false,
5
- "architectures": [
6
- "WhisperForConditionalGeneration"
7
- ],
8
- "attention_dropout": 0.0,
9
- "begin_suppress_tokens": null,
10
- "bos_token_id": 50257,
11
- "classifier_proj_size": 256,
12
- "d_model": 512,
13
- "decoder_attention_heads": 8,
14
- "decoder_ffn_dim": 2048,
15
- "decoder_layerdrop": 0.0,
16
- "decoder_layers": 6,
17
- "decoder_start_token_id": 50258,
18
- "dropout": 0.0,
19
- "dtype": "float32",
20
- "encoder_attention_heads": 8,
21
- "encoder_ffn_dim": 2048,
22
- "encoder_layerdrop": 0.0,
23
- "encoder_layers": 6,
24
- "eos_token_id": 50257,
25
- "forced_decoder_ids": [
26
- [
27
- 1,
28
- 50284
29
- ],
30
- [
31
- 2,
32
- 50359
33
- ],
34
- [
35
- 3,
36
- 50363
37
- ]
38
- ],
39
- "init_std": 0.02,
40
- "is_encoder_decoder": true,
41
- "mask_feature_length": 10,
42
- "mask_feature_min_masks": 0,
43
- "mask_feature_prob": 0.0,
44
- "mask_time_length": 10,
45
- "mask_time_min_masks": 2,
46
- "mask_time_prob": 0.05,
47
- "max_length": null,
48
- "max_source_positions": 1500,
49
- "max_target_positions": 448,
50
- "median_filter_width": 7,
51
- "model_type": "whisper",
52
- "num_hidden_layers": 6,
53
- "num_mel_bins": 80,
54
- "pad_token_id": 50257,
55
- "scale_embedding": false,
56
- "transformers_version": "4.57.0",
57
- "use_cache": false,
58
- "use_weighted_layer_sum": false,
59
- "vocab_size": 51865
60
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
final_best/generation_config.json DELETED
@@ -1,167 +0,0 @@
1
- {
2
- "alignment_heads": [
3
- [
4
- 3,
5
- 1
6
- ],
7
- [
8
- 4,
9
- 2
10
- ],
11
- [
12
- 4,
13
- 3
14
- ],
15
- [
16
- 4,
17
- 7
18
- ],
19
- [
20
- 5,
21
- 1
22
- ],
23
- [
24
- 5,
25
- 2
26
- ],
27
- [
28
- 5,
29
- 4
30
- ],
31
- [
32
- 5,
33
- 6
34
- ]
35
- ],
36
- "begin_suppress_tokens": [
37
- 220,
38
- 50257
39
- ],
40
- "bos_token_id": 50257,
41
- "decoder_start_token_id": 50258,
42
- "eos_token_id": 50257,
43
- "forced_decoder_ids": [
44
- [
45
- 1,
46
- null
47
- ],
48
- [
49
- 2,
50
- 50359
51
- ]
52
- ],
53
- "is_multilingual": true,
54
- "lang_to_id": {
55
- "<|af|>": 50327,
56
- "<|am|>": 50334,
57
- "<|ar|>": 50272,
58
- "<|as|>": 50350,
59
- "<|az|>": 50304,
60
- "<|ba|>": 50355,
61
- "<|be|>": 50330,
62
- "<|bg|>": 50292,
63
- "<|bn|>": 50302,
64
- "<|bo|>": 50347,
65
- "<|br|>": 50309,
66
- "<|bs|>": 50315,
67
- "<|ca|>": 50270,
68
- "<|cs|>": 50283,
69
- "<|cy|>": 50297,
70
- "<|da|>": 50285,
71
- "<|de|>": 50261,
72
- "<|el|>": 50281,
73
- "<|en|>": 50259,
74
- "<|es|>": 50262,
75
- "<|et|>": 50307,
76
- "<|eu|>": 50310,
77
- "<|fa|>": 50300,
78
- "<|fi|>": 50277,
79
- "<|fo|>": 50338,
80
- "<|fr|>": 50265,
81
- "<|gl|>": 50319,
82
- "<|gu|>": 50333,
83
- "<|haw|>": 50352,
84
- "<|ha|>": 50354,
85
- "<|he|>": 50279,
86
- "<|hi|>": 50276,
87
- "<|hr|>": 50291,
88
- "<|ht|>": 50339,
89
- "<|hu|>": 50286,
90
- "<|hy|>": 50312,
91
- "<|id|>": 50275,
92
- "<|is|>": 50311,
93
- "<|it|>": 50274,
94
- "<|ja|>": 50266,
95
- "<|jw|>": 50356,
96
- "<|ka|>": 50329,
97
- "<|kk|>": 50316,
98
- "<|km|>": 50323,
99
- "<|kn|>": 50306,
100
- "<|ko|>": 50264,
101
- "<|la|>": 50294,
102
- "<|lb|>": 50345,
103
- "<|ln|>": 50353,
104
- "<|lo|>": 50336,
105
- "<|lt|>": 50293,
106
- "<|lv|>": 50301,
107
- "<|mg|>": 50349,
108
- "<|mi|>": 50295,
109
- "<|mk|>": 50308,
110
- "<|ml|>": 50296,
111
- "<|mn|>": 50314,
112
- "<|mr|>": 50320,
113
- "<|ms|>": 50282,
114
- "<|mt|>": 50343,
115
- "<|my|>": 50346,
116
- "<|ne|>": 50313,
117
- "<|nl|>": 50271,
118
- "<|nn|>": 50342,
119
- "<|no|>": 50288,
120
- "<|oc|>": 50328,
121
- "<|pa|>": 50321,
122
- "<|pl|>": 50269,
123
- "<|ps|>": 50340,
124
- "<|pt|>": 50267,
125
- "<|ro|>": 50284,
126
- "<|ru|>": 50263,
127
- "<|sa|>": 50344,
128
- "<|sd|>": 50332,
129
- "<|si|>": 50322,
130
- "<|sk|>": 50298,
131
- "<|sl|>": 50305,
132
- "<|sn|>": 50324,
133
- "<|so|>": 50326,
134
- "<|sq|>": 50317,
135
- "<|sr|>": 50303,
136
- "<|su|>": 50357,
137
- "<|sv|>": 50273,
138
- "<|sw|>": 50318,
139
- "<|ta|>": 50287,
140
- "<|te|>": 50299,
141
- "<|tg|>": 50331,
142
- "<|th|>": 50289,
143
- "<|tk|>": 50341,
144
- "<|tl|>": 50348,
145
- "<|tr|>": 50268,
146
- "<|tt|>": 50351,
147
- "<|uk|>": 50280,
148
- "<|ur|>": 50290,
149
- "<|uz|>": 50337,
150
- "<|vi|>": 50278,
151
- "<|yi|>": 50335,
152
- "<|yo|>": 50325,
153
- "<|zh|>": 50260
154
- },
155
- "max_initial_timestamp_index": 50,
156
- "max_length": 448,
157
- "no_timestamps_token_id": 50363,
158
- "pad_token_id": 50257,
159
- "prev_sot_token_id": 50361,
160
- "return_timestamps": false,
161
- "suppress_tokens": [],
162
- "task_to_id": {
163
- "transcribe": 50359,
164
- "translate": 50358
165
- },
166
- "transformers_version": "4.57.0"
167
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
final_best/model.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a8f322db62b7f93d8c1575b22e5162ee15b30a3acb85f6cf40a1f1a039fa2869
3
- size 290403936
 
 
 
 
final_best/preprocessor_config.json DELETED
@@ -1,15 +0,0 @@
1
- {
2
- "chunk_length": 30,
3
- "dither": 0.0,
4
- "feature_extractor_type": "WhisperFeatureExtractor",
5
- "feature_size": 80,
6
- "hop_length": 160,
7
- "n_fft": 400,
8
- "n_samples": 480000,
9
- "nb_max_frames": 3000,
10
- "padding_side": "right",
11
- "padding_value": 0.0,
12
- "processor_class": "WhisperProcessor",
13
- "return_attention_mask": false,
14
- "sampling_rate": 16000
15
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
final_best/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:23700856d88d253a23832bbde43219c30963594a3e78343d0ce8b1d2f10e957b
3
- size 6033
 
 
 
 
final_best/merges.txt → merges.txt RENAMED
File without changes
final_best/normalizer.json → normalizer.json RENAMED
File without changes
final_best/special_tokens_map.json → special_tokens_map.json RENAMED
File without changes
final_best/tokenizer.json → tokenizer.json RENAMED
File without changes
final_best/tokenizer_config.json → tokenizer_config.json RENAMED
File without changes
final_best/vocab.json → vocab.json RENAMED
File without changes