veryfansome committed on
Commit
735d9e1
·
verified ·
1 Parent(s): 42a0efd

Upload 8 files

Browse files
models/ud_transform_only_20250317/added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "[MASK]": 128000
3
+ }
models/ud_transform_only_20250317/config.json ADDED
@@ -0,0 +1,375 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "microsoft/deberta-v3-base",
3
+ "architectures": [
4
+ "MultiHeadModel"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "hidden_act": "gelu",
8
+ "hidden_dropout_prob": 0.1,
9
+ "hidden_size": 768,
10
+ "initializer_range": 0.02,
11
+ "intermediate_size": 3072,
12
+ "label_maps": {
13
+ "AdjHead": [
14
+ "3",
15
+ "4+",
16
+ "1",
17
+ "2",
18
+ "O",
19
+ "-3",
20
+ "-2",
21
+ "-1",
22
+ "-4+"
23
+ ],
24
+ "AdvHead": [
25
+ "3",
26
+ "4+",
27
+ "1",
28
+ "2",
29
+ "O",
30
+ "-2",
31
+ "-3+",
32
+ "-1"
33
+ ],
34
+ "Case": [
35
+ "O",
36
+ "Acc",
37
+ "Nom"
38
+ ],
39
+ "CdHead": [
40
+ "3+",
41
+ "1",
42
+ "2",
43
+ "O",
44
+ "-2",
45
+ "-3+",
46
+ "-1"
47
+ ],
48
+ "ConjHead": [
49
+ "3",
50
+ "4+",
51
+ "-1+",
52
+ "1",
53
+ "2",
54
+ "O"
55
+ ],
56
+ "Definite": [
57
+ "O",
58
+ "Ind",
59
+ "Def"
60
+ ],
61
+ "Degree": [
62
+ "O",
63
+ "Sup",
64
+ "Pos",
65
+ "Cmp"
66
+ ],
67
+ "DetHead": [
68
+ "3",
69
+ "4+",
70
+ "1",
71
+ "2",
72
+ "O",
73
+ "-1",
74
+ "-2+"
75
+ ],
76
+ "Gender": [
77
+ "Fem",
78
+ "O",
79
+ "Neut",
80
+ "Masc"
81
+ ],
82
+ "InHead": [
83
+ "3",
84
+ "1",
85
+ "4",
86
+ "2",
87
+ "O",
88
+ "-1",
89
+ "-2+",
90
+ "5+"
91
+ ],
92
+ "ModalHead": [
93
+ "3+",
94
+ "-1+",
95
+ "1",
96
+ "2",
97
+ "O"
98
+ ],
99
+ "Mood": [
100
+ "Imp",
101
+ "O",
102
+ "Ind"
103
+ ],
104
+ "NounHead": [
105
+ "3",
106
+ "-4",
107
+ "4+",
108
+ "1",
109
+ "2",
110
+ "O",
111
+ "-3",
112
+ "-2",
113
+ "-1",
114
+ "-5+"
115
+ ],
116
+ "NumType": [
117
+ "Ord",
118
+ "O",
119
+ "Card",
120
+ "Mult"
121
+ ],
122
+ "Number": [
123
+ "Sing",
124
+ "O",
125
+ "Plur"
126
+ ],
127
+ "Person": [
128
+ "3",
129
+ "2",
130
+ "O",
131
+ "1"
132
+ ],
133
+ "Poss": [
134
+ "O",
135
+ "Yes"
136
+ ],
137
+ "PronType": [
138
+ "Prs",
139
+ "Dem",
140
+ "O",
141
+ "Int",
142
+ "Art",
143
+ "Rel"
144
+ ],
145
+ "PronounHead": [
146
+ "3+",
147
+ "1",
148
+ "2",
149
+ "O",
150
+ "-1",
151
+ "-2+"
152
+ ],
153
+ "Reflex": [
154
+ "O",
155
+ "Yes"
156
+ ],
157
+ "Tense": [
158
+ "Pres",
159
+ "O",
160
+ "Past"
161
+ ],
162
+ "ToHead": [
163
+ "2+",
164
+ "O",
165
+ "-1+",
166
+ "1"
167
+ ],
168
+ "Typo": [
169
+ "O",
170
+ "Yes"
171
+ ],
172
+ "VerbForm": [
173
+ "Part",
174
+ "O",
175
+ "Inf",
176
+ "Ger",
177
+ "Fin"
178
+ ],
179
+ "VerbHead": [
180
+ "3",
181
+ "-4",
182
+ "4+",
183
+ "1",
184
+ "2",
185
+ "O",
186
+ "-3",
187
+ "-2",
188
+ "-1",
189
+ "-5+"
190
+ ],
191
+ "WhHead": [
192
+ "3",
193
+ "4+",
194
+ "1",
195
+ "2",
196
+ "O",
197
+ "-1",
198
+ "-2+"
199
+ ],
200
+ "deprel": [
201
+ "cc",
202
+ "det",
203
+ "amod",
204
+ "nummod",
205
+ "expl",
206
+ "discourse",
207
+ "nsubj",
208
+ "compound",
209
+ "csubj:pass",
210
+ "root",
211
+ "nmod:poss",
212
+ "flat",
213
+ "flat:foreign",
214
+ "obl:npmod",
215
+ "reparandum",
216
+ "csubj",
217
+ "acl",
218
+ "obj",
219
+ "ccomp",
220
+ "aux:pass",
221
+ "compound:prt",
222
+ "nmod:npmod",
223
+ "punct",
224
+ "dep",
225
+ "cc:preconj",
226
+ "aux",
227
+ "nsubj:pass",
228
+ "goeswith",
229
+ "parataxis",
230
+ "nmod:tmod",
231
+ "conj",
232
+ "advmod",
233
+ "nmod",
234
+ "fixed",
235
+ "appos",
236
+ "list",
237
+ "xcomp",
238
+ "mark",
239
+ "advcl",
240
+ "acl:relcl",
241
+ "dislocated",
242
+ "obl",
243
+ "det:predet",
244
+ "orphan",
245
+ "obl:tmod",
246
+ "vocative",
247
+ "case",
248
+ "cop",
249
+ "iobj"
250
+ ],
251
+ "pos": [
252
+ "VERB",
253
+ "PUNCT",
254
+ "NUM",
255
+ "PROPN",
256
+ "CCONJ",
257
+ "ADV",
258
+ "X",
259
+ "SYM",
260
+ "DET",
261
+ "ADJ",
262
+ "PART",
263
+ "PRON",
264
+ "INTJ",
265
+ "ADP",
266
+ "AUX",
267
+ "SCONJ",
268
+ "NOUN"
269
+ ],
270
+ "xpos": [
271
+ "-LRB-",
272
+ "RBS",
273
+ ".",
274
+ "``",
275
+ "NNPS",
276
+ "LS",
277
+ "JJR",
278
+ "POS",
279
+ "$",
280
+ "JJ",
281
+ "NFP",
282
+ "VBN",
283
+ "VBG",
284
+ "PRP$",
285
+ "RBR",
286
+ ":",
287
+ "VBZ",
288
+ "VBP",
289
+ "RB",
290
+ "CD",
291
+ "SYM",
292
+ "WDT",
293
+ "VB",
294
+ "NNP",
295
+ "WP",
296
+ "NN",
297
+ "TO",
298
+ "DT",
299
+ "IN",
300
+ ",",
301
+ "PRP",
302
+ "-RRB-",
303
+ "FW",
304
+ "JJS",
305
+ "''",
306
+ "MD",
307
+ "EX",
308
+ "RP",
309
+ "HYPH",
310
+ "NNS",
311
+ "VBD",
312
+ "WRB",
313
+ "ADD",
314
+ "WP$",
315
+ "CC",
316
+ "PDT",
317
+ "UH"
318
+ ]
319
+ },
320
+ "layer_norm_eps": 1e-07,
321
+ "legacy": true,
322
+ "max_position_embeddings": 512,
323
+ "max_relative_positions": -1,
324
+ "model_type": "deberta-v2",
325
+ "norm_rel_ebd": "layer_norm",
326
+ "num_attention_heads": 12,
327
+ "num_hidden_layers": 12,
328
+ "num_labels_dict": {
329
+ "AdjHead": 9,
330
+ "AdvHead": 8,
331
+ "Case": 3,
332
+ "CdHead": 7,
333
+ "ConjHead": 6,
334
+ "Definite": 3,
335
+ "Degree": 4,
336
+ "DetHead": 7,
337
+ "Gender": 4,
338
+ "InHead": 8,
339
+ "ModalHead": 5,
340
+ "Mood": 3,
341
+ "NounHead": 10,
342
+ "NumType": 4,
343
+ "Number": 3,
344
+ "Person": 4,
345
+ "Poss": 2,
346
+ "PronType": 6,
347
+ "PronounHead": 6,
348
+ "Reflex": 2,
349
+ "Tense": 3,
350
+ "ToHead": 4,
351
+ "Typo": 2,
352
+ "VerbForm": 5,
353
+ "VerbHead": 10,
354
+ "WhHead": 7,
355
+ "deprel": 49,
356
+ "pos": 17,
357
+ "xpos": 47
358
+ },
359
+ "pad_token_id": 0,
360
+ "pooler_dropout": 0,
361
+ "pooler_hidden_act": "gelu",
362
+ "pooler_hidden_size": 768,
363
+ "pos_att_type": [
364
+ "p2c",
365
+ "c2p"
366
+ ],
367
+ "position_biased_input": false,
368
+ "position_buckets": 256,
369
+ "relative_attention": true,
370
+ "share_att_key": true,
371
+ "torch_dtype": "float32",
372
+ "transformers_version": "4.49.0",
373
+ "type_vocab_size": 0,
374
+ "vocab_size": 128100
375
+ }
models/ud_transform_only_20250317/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf5f0912bb6a842c7c65f9356e9a96565b30d7bcf263cc72d8efe6095a55c468
3
+ size 736118392
models/ud_transform_only_20250317/special_tokens_map.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "[CLS]",
3
+ "cls_token": "[CLS]",
4
+ "eos_token": "[SEP]",
5
+ "mask_token": "[MASK]",
6
+ "pad_token": "[PAD]",
7
+ "sep_token": "[SEP]",
8
+ "unk_token": {
9
+ "content": "[UNK]",
10
+ "lstrip": false,
11
+ "normalized": true,
12
+ "rstrip": false,
13
+ "single_word": false
14
+ }
15
+ }
models/ud_transform_only_20250317/spm.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c679fbf93643d19aab7ee10c0b99e460bdbc02fedf34b92b05af343b4af586fd
3
+ size 2464616
models/ud_transform_only_20250317/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
models/ud_transform_only_20250317/tokenizer_config.json ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": true,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "[PAD]",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "1": {
13
+ "content": "[CLS]",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "2": {
21
+ "content": "[SEP]",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "3": {
29
+ "content": "[UNK]",
30
+ "lstrip": false,
31
+ "normalized": true,
32
+ "rstrip": false,
33
+ "single_word": false,
34
+ "special": true
35
+ },
36
+ "128000": {
37
+ "content": "[MASK]",
38
+ "lstrip": false,
39
+ "normalized": false,
40
+ "rstrip": false,
41
+ "single_word": false,
42
+ "special": true
43
+ }
44
+ },
45
+ "bos_token": "[CLS]",
46
+ "clean_up_tokenization_spaces": false,
47
+ "cls_token": "[CLS]",
48
+ "do_lower_case": false,
49
+ "eos_token": "[SEP]",
50
+ "extra_special_tokens": {},
51
+ "mask_token": "[MASK]",
52
+ "model_max_length": 1000000000000000019884624838656,
53
+ "pad_token": "[PAD]",
54
+ "sep_token": "[SEP]",
55
+ "sp_model_kwargs": {},
56
+ "split_by_punct": false,
57
+ "tokenizer_class": "DebertaV2Tokenizer",
58
+ "unk_token": "[UNK]",
59
+ "vocab_type": "spm"
60
+ }
models/ud_transform_only_20250317/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62da87fcc370ea3b1d74cd9b788e0e10af85e4d1bdafc97d3602849881a723bb
3
+ size 5240