Samuael committed on
Commit
d2c8b01
·
verified ·
1 Parent(s): 238c235

Samuael/amBART_1000

Browse files
README.md CHANGED
@@ -1,4 +1,5 @@
1
  ---
 
2
  tags:
3
  - generated_from_trainer
4
  model-index:
@@ -11,7 +12,17 @@ should probably proofread and complete it, then remove this comment. -->
11
 
12
  # amBART
13
 
14
- This model is a fine-tuned version of [](https://huggingface.co/) on an unknown dataset.
 
 
 
 
 
 
 
 
 
 
15
 
16
  ## Model description
17
 
@@ -30,17 +41,18 @@ More information needed
30
  ### Training hyperparameters
31
 
32
  The following hyperparameters were used during training:
33
- - learning_rate: 0.005
34
- - train_batch_size: 64
35
- - eval_batch_size: 64
36
  - seed: 42
37
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
38
  - lr_scheduler_type: linear
39
- - num_epochs: 30
 
40
 
41
  ### Framework versions
42
 
43
- - Transformers 4.38.1
44
  - Pytorch 2.1.0+cu121
45
  - Datasets 2.18.0
46
  - Tokenizers 0.15.2
 
1
  ---
2
+ base_model: Samuael/amBART_1000
3
  tags:
4
  - generated_from_trainer
5
  model-index:
 
12
 
13
  # amBART
14
 
15
+ This model is a fine-tuned version of [Samuael/amBART_1000](https://huggingface.co/Samuael/amBART_1000) on an unknown dataset.
16
+ It achieves the following results on the evaluation set:
17
+ - eval_loss: 2.9935
18
+ - eval_wer: 0.9817
19
+ - eval_cer: 0.7707
20
+ - eval_bleu: 0.7418
21
+ - eval_runtime: 9.129
22
+ - eval_samples_per_second: 39.325
23
+ - eval_steps_per_second: 0.329
24
+ - epoch: 3.0
25
+ - step: 2127
26
 
27
  ## Model description
28
 
 
41
  ### Training hyperparameters
42
 
43
  The following hyperparameters were used during training:
44
+ - learning_rate: 0.002
45
+ - train_batch_size: 128
46
+ - eval_batch_size: 128
47
  - seed: 42
48
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
49
  - lr_scheduler_type: linear
50
+ - num_epochs: 50
51
+ - mixed_precision_training: Native AMP
52
 
53
  ### Framework versions
54
 
55
+ - Transformers 4.38.2
56
  - Pytorch 2.1.0+cu121
57
  - Datasets 2.18.0
58
  - Tokenizers 0.15.2
config.json CHANGED
@@ -1,8 +1,9 @@
1
  {
 
2
  "activation_dropout": 0.0,
3
  "activation_function": "gelu",
4
  "architectures": [
5
- "MBartModel"
6
  ],
7
  "attention_dropout": 0.0,
8
  "bos_token_id": 0,
@@ -30,5 +31,5 @@
30
  "torch_dtype": "float32",
31
  "transformers_version": "4.38.2",
32
  "use_cache": true,
33
- "vocab_size": 260
34
  }
 
1
  {
2
+ "_name_or_path": "Samuael/amBART_1000",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "architectures": [
6
+ "MBartForConditionalGeneration"
7
  ],
8
  "attention_dropout": 0.0,
9
  "bos_token_id": 0,
 
31
  "torch_dtype": "float32",
32
  "transformers_version": "4.38.2",
33
  "use_cache": true,
34
+ "vocab_size": 1027
35
  }
generation_config.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 0,
3
+ "eos_token_id": 2,
4
+ "forced_eos_token_id": 2,
5
+ "max_length": 300,
6
+ "pad_token_id": 1,
7
+ "transformers_version": "4.38.2"
8
+ }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:57edf11149bec1eb85c6a8a425f6a023546e7838de010875b91419bea4fadbef
3
- size 179236624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1504bcd0758ac82ab09f78650ebc0c7c431edde67e78c5fb92b4befcf30c490e
3
+ size 180813204
sentencepiece.bpe.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc579c42f174c74d5a56bc4a02e6eef7759711b9415d2fd1bf4810683bdb69c5
3
- size 240450
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b2c9b3910462e773a7ace377cb26a40053dcfe4054d8eb8ecc5460495a93d9b
3
+ size 253575
special_tokens_map.json CHANGED
@@ -1,12 +1,73 @@
1
  {
2
  "additional_special_tokens": [
3
  "ar_AR",
4
- "cs_CZ"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  ],
6
- "bos_token": "<s>",
7
- "cls_token": "<s>",
8
- "eos_token": "</s>",
9
- "pad_token": "<pad>",
10
- "sep_token": "</s>",
11
- "unk_token": "<unk>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
  }
 
1
  {
2
  "additional_special_tokens": [
3
  "ar_AR",
4
+ "cs_CZ",
5
+ "de_DE",
6
+ "en_XX",
7
+ "es_XX",
8
+ "et_EE",
9
+ "fi_FI",
10
+ "fr_XX",
11
+ "gu_IN",
12
+ "hi_IN",
13
+ "it_IT",
14
+ "ja_XX",
15
+ "kk_KZ",
16
+ "ko_KR",
17
+ "lt_LT",
18
+ "lv_LV",
19
+ "my_MM",
20
+ "ne_NP",
21
+ "nl_XX",
22
+ "ro_RO",
23
+ "ru_RU",
24
+ "si_LK",
25
+ "tr_TR",
26
+ "vi_VN",
27
+ "zh_CN",
28
+ "▁በኋላ",
29
+ "ብር"
30
  ],
31
+ "bos_token": {
32
+ "content": "<s>",
33
+ "lstrip": false,
34
+ "normalized": false,
35
+ "rstrip": false,
36
+ "single_word": false
37
+ },
38
+ "cls_token": {
39
+ "content": "<s>",
40
+ "lstrip": false,
41
+ "normalized": false,
42
+ "rstrip": false,
43
+ "single_word": false
44
+ },
45
+ "eos_token": {
46
+ "content": "</s>",
47
+ "lstrip": false,
48
+ "normalized": false,
49
+ "rstrip": false,
50
+ "single_word": false
51
+ },
52
+ "pad_token": {
53
+ "content": "<pad>",
54
+ "lstrip": false,
55
+ "normalized": false,
56
+ "rstrip": false,
57
+ "single_word": false
58
+ },
59
+ "sep_token": {
60
+ "content": "</s>",
61
+ "lstrip": false,
62
+ "normalized": false,
63
+ "rstrip": false,
64
+ "single_word": false
65
+ },
66
+ "unk_token": {
67
+ "content": "<unk>",
68
+ "lstrip": false,
69
+ "normalized": false,
70
+ "rstrip": false,
71
+ "single_word": false
72
+ }
73
  }
tokenizer_config.json CHANGED
@@ -33,7 +33,7 @@
33
  "special": true
34
  },
35
  "234": {
36
- "content": "ar_AR",
37
  "lstrip": false,
38
  "normalized": false,
39
  "rstrip": false,
@@ -41,6 +41,22 @@
41
  "special": true
42
  },
43
  "235": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
44
  "content": "cs_CZ",
45
  "lstrip": false,
46
  "normalized": false,
@@ -48,7 +64,7 @@
48
  "single_word": false,
49
  "special": true
50
  },
51
- "236": {
52
  "content": "de_DE",
53
  "lstrip": false,
54
  "normalized": false,
@@ -56,7 +72,7 @@
56
  "single_word": false,
57
  "special": true
58
  },
59
- "237": {
60
  "content": "en_XX",
61
  "lstrip": false,
62
  "normalized": false,
@@ -64,7 +80,7 @@
64
  "single_word": false,
65
  "special": true
66
  },
67
- "238": {
68
  "content": "es_XX",
69
  "lstrip": false,
70
  "normalized": false,
@@ -72,7 +88,7 @@
72
  "single_word": false,
73
  "special": true
74
  },
75
- "239": {
76
  "content": "et_EE",
77
  "lstrip": false,
78
  "normalized": false,
@@ -80,7 +96,7 @@
80
  "single_word": false,
81
  "special": true
82
  },
83
- "240": {
84
  "content": "fi_FI",
85
  "lstrip": false,
86
  "normalized": false,
@@ -88,7 +104,7 @@
88
  "single_word": false,
89
  "special": true
90
  },
91
- "241": {
92
  "content": "fr_XX",
93
  "lstrip": false,
94
  "normalized": false,
@@ -96,7 +112,7 @@
96
  "single_word": false,
97
  "special": true
98
  },
99
- "242": {
100
  "content": "gu_IN",
101
  "lstrip": false,
102
  "normalized": false,
@@ -104,7 +120,7 @@
104
  "single_word": false,
105
  "special": true
106
  },
107
- "243": {
108
  "content": "hi_IN",
109
  "lstrip": false,
110
  "normalized": false,
@@ -112,7 +128,7 @@
112
  "single_word": false,
113
  "special": true
114
  },
115
- "244": {
116
  "content": "it_IT",
117
  "lstrip": false,
118
  "normalized": false,
@@ -120,7 +136,7 @@
120
  "single_word": false,
121
  "special": true
122
  },
123
- "245": {
124
  "content": "ja_XX",
125
  "lstrip": false,
126
  "normalized": false,
@@ -128,7 +144,7 @@
128
  "single_word": false,
129
  "special": true
130
  },
131
- "246": {
132
  "content": "kk_KZ",
133
  "lstrip": false,
134
  "normalized": false,
@@ -136,7 +152,7 @@
136
  "single_word": false,
137
  "special": true
138
  },
139
- "247": {
140
  "content": "ko_KR",
141
  "lstrip": false,
142
  "normalized": false,
@@ -144,7 +160,7 @@
144
  "single_word": false,
145
  "special": true
146
  },
147
- "248": {
148
  "content": "lt_LT",
149
  "lstrip": false,
150
  "normalized": false,
@@ -152,7 +168,7 @@
152
  "single_word": false,
153
  "special": true
154
  },
155
- "249": {
156
  "content": "lv_LV",
157
  "lstrip": false,
158
  "normalized": false,
@@ -160,7 +176,7 @@
160
  "single_word": false,
161
  "special": true
162
  },
163
- "250": {
164
  "content": "my_MM",
165
  "lstrip": false,
166
  "normalized": false,
@@ -168,7 +184,7 @@
168
  "single_word": false,
169
  "special": true
170
  },
171
- "251": {
172
  "content": "ne_NP",
173
  "lstrip": false,
174
  "normalized": false,
@@ -176,7 +192,7 @@
176
  "single_word": false,
177
  "special": true
178
  },
179
- "252": {
180
  "content": "nl_XX",
181
  "lstrip": false,
182
  "normalized": false,
@@ -184,7 +200,7 @@
184
  "single_word": false,
185
  "special": true
186
  },
187
- "253": {
188
  "content": "ro_RO",
189
  "lstrip": false,
190
  "normalized": false,
@@ -192,7 +208,7 @@
192
  "single_word": false,
193
  "special": true
194
  },
195
- "254": {
196
  "content": "ru_RU",
197
  "lstrip": false,
198
  "normalized": false,
@@ -200,7 +216,7 @@
200
  "single_word": false,
201
  "special": true
202
  },
203
- "255": {
204
  "content": "si_LK",
205
  "lstrip": false,
206
  "normalized": false,
@@ -208,7 +224,7 @@
208
  "single_word": false,
209
  "special": true
210
  },
211
- "256": {
212
  "content": "tr_TR",
213
  "lstrip": false,
214
  "normalized": false,
@@ -216,7 +232,7 @@
216
  "single_word": false,
217
  "special": true
218
  },
219
- "257": {
220
  "content": "vi_VN",
221
  "lstrip": false,
222
  "normalized": false,
@@ -224,7 +240,7 @@
224
  "single_word": false,
225
  "special": true
226
  },
227
- "258": {
228
  "content": "zh_CN",
229
  "lstrip": false,
230
  "normalized": false,
@@ -235,7 +251,32 @@
235
  },
236
  "additional_special_tokens": [
237
  "ar_AR",
238
- "cs_CZ"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
239
  ],
240
  "bos_token": "<s>",
241
  "clean_up_tokenization_spaces": true,
@@ -249,6 +290,5 @@
249
  "src_lang": "ar_AR",
250
  "tgt_lang": "cs_CZ",
251
  "tokenizer_class": "MBartTokenizer",
252
- "tokenizer_file": null,
253
  "unk_token": "<unk>"
254
  }
 
33
  "special": true
34
  },
35
  "234": {
36
+ "content": "▁በኋላ",
37
  "lstrip": false,
38
  "normalized": false,
39
  "rstrip": false,
 
41
  "special": true
42
  },
43
  "235": {
44
+ "content": "ብር",
45
+ "lstrip": false,
46
+ "normalized": false,
47
+ "rstrip": false,
48
+ "single_word": false,
49
+ "special": true
50
+ },
51
+ "1001": {
52
+ "content": "ar_AR",
53
+ "lstrip": false,
54
+ "normalized": false,
55
+ "rstrip": false,
56
+ "single_word": false,
57
+ "special": true
58
+ },
59
+ "1002": {
60
  "content": "cs_CZ",
61
  "lstrip": false,
62
  "normalized": false,
 
64
  "single_word": false,
65
  "special": true
66
  },
67
+ "1003": {
68
  "content": "de_DE",
69
  "lstrip": false,
70
  "normalized": false,
 
72
  "single_word": false,
73
  "special": true
74
  },
75
+ "1004": {
76
  "content": "en_XX",
77
  "lstrip": false,
78
  "normalized": false,
 
80
  "single_word": false,
81
  "special": true
82
  },
83
+ "1005": {
84
  "content": "es_XX",
85
  "lstrip": false,
86
  "normalized": false,
 
88
  "single_word": false,
89
  "special": true
90
  },
91
+ "1006": {
92
  "content": "et_EE",
93
  "lstrip": false,
94
  "normalized": false,
 
96
  "single_word": false,
97
  "special": true
98
  },
99
+ "1007": {
100
  "content": "fi_FI",
101
  "lstrip": false,
102
  "normalized": false,
 
104
  "single_word": false,
105
  "special": true
106
  },
107
+ "1008": {
108
  "content": "fr_XX",
109
  "lstrip": false,
110
  "normalized": false,
 
112
  "single_word": false,
113
  "special": true
114
  },
115
+ "1009": {
116
  "content": "gu_IN",
117
  "lstrip": false,
118
  "normalized": false,
 
120
  "single_word": false,
121
  "special": true
122
  },
123
+ "1010": {
124
  "content": "hi_IN",
125
  "lstrip": false,
126
  "normalized": false,
 
128
  "single_word": false,
129
  "special": true
130
  },
131
+ "1011": {
132
  "content": "it_IT",
133
  "lstrip": false,
134
  "normalized": false,
 
136
  "single_word": false,
137
  "special": true
138
  },
139
+ "1012": {
140
  "content": "ja_XX",
141
  "lstrip": false,
142
  "normalized": false,
 
144
  "single_word": false,
145
  "special": true
146
  },
147
+ "1013": {
148
  "content": "kk_KZ",
149
  "lstrip": false,
150
  "normalized": false,
 
152
  "single_word": false,
153
  "special": true
154
  },
155
+ "1014": {
156
  "content": "ko_KR",
157
  "lstrip": false,
158
  "normalized": false,
 
160
  "single_word": false,
161
  "special": true
162
  },
163
+ "1015": {
164
  "content": "lt_LT",
165
  "lstrip": false,
166
  "normalized": false,
 
168
  "single_word": false,
169
  "special": true
170
  },
171
+ "1016": {
172
  "content": "lv_LV",
173
  "lstrip": false,
174
  "normalized": false,
 
176
  "single_word": false,
177
  "special": true
178
  },
179
+ "1017": {
180
  "content": "my_MM",
181
  "lstrip": false,
182
  "normalized": false,
 
184
  "single_word": false,
185
  "special": true
186
  },
187
+ "1018": {
188
  "content": "ne_NP",
189
  "lstrip": false,
190
  "normalized": false,
 
192
  "single_word": false,
193
  "special": true
194
  },
195
+ "1019": {
196
  "content": "nl_XX",
197
  "lstrip": false,
198
  "normalized": false,
 
200
  "single_word": false,
201
  "special": true
202
  },
203
+ "1020": {
204
  "content": "ro_RO",
205
  "lstrip": false,
206
  "normalized": false,
 
208
  "single_word": false,
209
  "special": true
210
  },
211
+ "1021": {
212
  "content": "ru_RU",
213
  "lstrip": false,
214
  "normalized": false,
 
216
  "single_word": false,
217
  "special": true
218
  },
219
+ "1022": {
220
  "content": "si_LK",
221
  "lstrip": false,
222
  "normalized": false,
 
224
  "single_word": false,
225
  "special": true
226
  },
227
+ "1023": {
228
  "content": "tr_TR",
229
  "lstrip": false,
230
  "normalized": false,
 
232
  "single_word": false,
233
  "special": true
234
  },
235
+ "1024": {
236
  "content": "vi_VN",
237
  "lstrip": false,
238
  "normalized": false,
 
240
  "single_word": false,
241
  "special": true
242
  },
243
+ "1025": {
244
  "content": "zh_CN",
245
  "lstrip": false,
246
  "normalized": false,
 
251
  },
252
  "additional_special_tokens": [
253
  "ar_AR",
254
+ "cs_CZ",
255
+ "de_DE",
256
+ "en_XX",
257
+ "es_XX",
258
+ "et_EE",
259
+ "fi_FI",
260
+ "fr_XX",
261
+ "gu_IN",
262
+ "hi_IN",
263
+ "it_IT",
264
+ "ja_XX",
265
+ "kk_KZ",
266
+ "ko_KR",
267
+ "lt_LT",
268
+ "lv_LV",
269
+ "my_MM",
270
+ "ne_NP",
271
+ "nl_XX",
272
+ "ro_RO",
273
+ "ru_RU",
274
+ "si_LK",
275
+ "tr_TR",
276
+ "vi_VN",
277
+ "zh_CN",
278
+ "▁በኋላ",
279
+ "ብር"
280
  ],
281
  "bos_token": "<s>",
282
  "clean_up_tokenization_spaces": true,
 
290
  "src_lang": "ar_AR",
291
  "tgt_lang": "cs_CZ",
292
  "tokenizer_class": "MBartTokenizer",
 
293
  "unk_token": "<unk>"
294
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e53a7bf06d7267874d2691850983fbffe4f8767761a181083359c679d97356d0
3
- size 5048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f19be77b3b5f0472323533764679e1f13184f30ee05c97f781d3b916fe948fbe
3
+ size 4984