veryfansome committed on
Commit
6a56edd
·
verified ·
1 Parent(s): ed6dacc

Upload 9 files

Browse files
models/ud_augmented_jj_rb_types_20250320_v2/README.md ADDED
The diff for this file is too large to render. See raw diff
 
models/ud_augmented_jj_rb_types_20250320_v2/added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "[MASK]": 128000
3
+ }
models/ud_augmented_jj_rb_types_20250320_v2/config.json ADDED
@@ -0,0 +1,388 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "models/ud_augmented_jj_rb_types_20250320_v2",
3
+ "architectures": [
4
+ "MultiHeadModel"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "hidden_act": "gelu",
8
+ "hidden_dropout_prob": 0.1,
9
+ "hidden_size": 768,
10
+ "initializer_range": 0.02,
11
+ "intermediate_size": 3072,
12
+ "label_maps": {
13
+ "AdjGrad": [
14
+ "yes",
15
+ "no",
16
+ "O"
17
+ ],
18
+ "AdjHead": [
19
+ "2",
20
+ "4+",
21
+ "-1",
22
+ "O",
23
+ "-4+",
24
+ "3",
25
+ "1",
26
+ "-2",
27
+ "-3"
28
+ ],
29
+ "AdjPos": [
30
+ "postpositive",
31
+ "attributive",
32
+ "predicative",
33
+ "O"
34
+ ],
35
+ "AdjType": [
36
+ "material",
37
+ "quantifying",
38
+ "color",
39
+ "size",
40
+ "O",
41
+ "quality",
42
+ "purpose",
43
+ "origin",
44
+ "relational",
45
+ "age",
46
+ "shape",
47
+ "limiting"
48
+ ],
49
+ "AdvHead": [
50
+ "-3+",
51
+ "2",
52
+ "4+",
53
+ "-1",
54
+ "O",
55
+ "3",
56
+ "1",
57
+ "-2"
58
+ ],
59
+ "AdvType": [
60
+ "manner",
61
+ "time",
62
+ "negation",
63
+ "conjunctive",
64
+ "frequency",
65
+ "focusing",
66
+ "O",
67
+ "place",
68
+ "degree",
69
+ "disjunct",
70
+ "modal"
71
+ ],
72
+ "Case": [
73
+ "Acc",
74
+ "Nom",
75
+ "O"
76
+ ],
77
+ "CdHead": [
78
+ "-3+",
79
+ "2",
80
+ "-1",
81
+ "3+",
82
+ "O",
83
+ "1",
84
+ "-2"
85
+ ],
86
+ "ConjHead": [
87
+ "2",
88
+ "4+",
89
+ "O",
90
+ "3",
91
+ "1",
92
+ "-1+"
93
+ ],
94
+ "Definite": [
95
+ "Def",
96
+ "Ind",
97
+ "O"
98
+ ],
99
+ "Degree": [
100
+ "Cmp",
101
+ "Pos",
102
+ "Sup",
103
+ "O"
104
+ ],
105
+ "DetHead": [
106
+ "-2+",
107
+ "2",
108
+ "4+",
109
+ "-1",
110
+ "O",
111
+ "3",
112
+ "1"
113
+ ],
114
+ "Gender": [
115
+ "Fem",
116
+ "Masc",
117
+ "Neut",
118
+ "O"
119
+ ],
120
+ "InHead": [
121
+ "4",
122
+ "2",
123
+ "-2+",
124
+ "-1",
125
+ "O",
126
+ "3",
127
+ "5+",
128
+ "1"
129
+ ],
130
+ "MdHead": [
131
+ "2",
132
+ "3+",
133
+ "O",
134
+ "1",
135
+ "-1+"
136
+ ],
137
+ "Mood": [
138
+ "Imp",
139
+ "Ind",
140
+ "O"
141
+ ],
142
+ "NounHead": [
143
+ "2",
144
+ "4+",
145
+ "-5+",
146
+ "-1",
147
+ "O",
148
+ "3",
149
+ "-4",
150
+ "1",
151
+ "-2",
152
+ "-3"
153
+ ],
154
+ "NumType": [
155
+ "Mult",
156
+ "Card",
157
+ "Ord",
158
+ "O"
159
+ ],
160
+ "Number": [
161
+ "Plur",
162
+ "Sing",
163
+ "O"
164
+ ],
165
+ "Person": [
166
+ "3",
167
+ "1",
168
+ "2",
169
+ "O"
170
+ ],
171
+ "PronHead": [
172
+ "-2+",
173
+ "2",
174
+ "-1",
175
+ "3+",
176
+ "O",
177
+ "1"
178
+ ],
179
+ "PronType": [
180
+ "Dem",
181
+ "O",
182
+ "Rel",
183
+ "Int",
184
+ "Prs",
185
+ "Art"
186
+ ],
187
+ "Tense": [
188
+ "Past",
189
+ "Pres",
190
+ "O"
191
+ ],
192
+ "VerbForm": [
193
+ "Ger",
194
+ "Inf",
195
+ "O",
196
+ "Part",
197
+ "Fin"
198
+ ],
199
+ "VerbHead": [
200
+ "2",
201
+ "4+",
202
+ "-5+",
203
+ "-1",
204
+ "O",
205
+ "3",
206
+ "-4",
207
+ "1",
208
+ "-2",
209
+ "-3"
210
+ ],
211
+ "WhHead": [
212
+ "-2+",
213
+ "2",
214
+ "4+",
215
+ "-1",
216
+ "O",
217
+ "3",
218
+ "1"
219
+ ],
220
+ "deprel": [
221
+ "punct",
222
+ "compound",
223
+ "obl",
224
+ "case",
225
+ "obj",
226
+ "nsubj:pass",
227
+ "cc:preconj",
228
+ "list",
229
+ "mark",
230
+ "parataxis",
231
+ "acl",
232
+ "obl:npmod",
233
+ "root",
234
+ "nmod:poss",
235
+ "flat",
236
+ "iobj",
237
+ "nsubj",
238
+ "expl",
239
+ "compound:prt",
240
+ "cop",
241
+ "vocative",
242
+ "nmod",
243
+ "aux:pass",
244
+ "ccomp",
245
+ "det",
246
+ "csubj",
247
+ "obl:tmod",
248
+ "xcomp",
249
+ "aux",
250
+ "discourse",
251
+ "acl:relcl",
252
+ "cc",
253
+ "nmod:npmod",
254
+ "appos",
255
+ "advcl",
256
+ "conj",
257
+ "fixed",
258
+ "advmod",
259
+ "det:predet",
260
+ "amod",
261
+ "nmod:tmod",
262
+ "nummod"
263
+ ],
264
+ "pos": [
265
+ "INTJ",
266
+ "VERB",
267
+ "SYM",
268
+ "PROPN",
269
+ "ADV",
270
+ "AUX",
271
+ "SCONJ",
272
+ "ADJ",
273
+ "DET",
274
+ "NUM",
275
+ "PRON",
276
+ "NOUN",
277
+ "X",
278
+ "CCONJ",
279
+ "ADP",
280
+ "PUNCT",
281
+ "PART"
282
+ ],
283
+ "xpos": [
284
+ "FW",
285
+ "RBR",
286
+ "NNPS",
287
+ "DT",
288
+ "PDT",
289
+ "EX",
290
+ "HYPH",
291
+ "CD",
292
+ "ADD",
293
+ "SYM",
294
+ "PRP",
295
+ "JJR",
296
+ "MD",
297
+ "WDT",
298
+ "JJ",
299
+ "RB",
300
+ "RP",
301
+ "TO",
302
+ "NNP",
303
+ "NN",
304
+ "CC",
305
+ "-RRB-",
306
+ "VBP",
307
+ "WRB",
308
+ "''",
309
+ "IN",
310
+ ":",
311
+ "LS",
312
+ "-LRB-",
313
+ "VBD",
314
+ "VBN",
315
+ ".",
316
+ "VBZ",
317
+ "VBG",
318
+ "WP$",
319
+ "JJS",
320
+ "VB",
321
+ "NNS",
322
+ "``",
323
+ "POS",
324
+ "UH",
325
+ "PRP$",
326
+ "NFP",
327
+ "$",
328
+ "RBS",
329
+ ",",
330
+ "WP"
331
+ ]
332
+ },
333
+ "layer_norm_eps": 1e-07,
334
+ "legacy": true,
335
+ "max_position_embeddings": 512,
336
+ "max_relative_positions": -1,
337
+ "model_type": "deberta-v2",
338
+ "norm_rel_ebd": "layer_norm",
339
+ "num_attention_heads": 12,
340
+ "num_hidden_layers": 12,
341
+ "num_labels_dict": {
342
+ "AdjGrad": 3,
343
+ "AdjHead": 9,
344
+ "AdjPos": 4,
345
+ "AdjType": 12,
346
+ "AdvHead": 8,
347
+ "AdvType": 11,
348
+ "Case": 3,
349
+ "CdHead": 7,
350
+ "ConjHead": 6,
351
+ "Definite": 3,
352
+ "Degree": 4,
353
+ "DetHead": 7,
354
+ "Gender": 4,
355
+ "InHead": 8,
356
+ "MdHead": 5,
357
+ "Mood": 3,
358
+ "NounHead": 10,
359
+ "NumType": 4,
360
+ "Number": 3,
361
+ "Person": 4,
362
+ "PronHead": 6,
363
+ "PronType": 6,
364
+ "Tense": 3,
365
+ "VerbForm": 5,
366
+ "VerbHead": 10,
367
+ "WhHead": 7,
368
+ "deprel": 42,
369
+ "pos": 17,
370
+ "xpos": 47
371
+ },
372
+ "pad_token_id": 0,
373
+ "pooler_dropout": 0,
374
+ "pooler_hidden_act": "gelu",
375
+ "pooler_hidden_size": 768,
376
+ "pos_att_type": [
377
+ "p2c",
378
+ "c2p"
379
+ ],
380
+ "position_biased_input": false,
381
+ "position_buckets": 256,
382
+ "relative_attention": true,
383
+ "share_att_key": true,
384
+ "torch_dtype": "float32",
385
+ "transformers_version": "4.49.0",
386
+ "type_vocab_size": 0,
387
+ "vocab_size": 128100
388
+ }
models/ud_augmented_jj_rb_types_20250320_v2/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57b5dda10a3ea434194a6896dce6e4e1e1290a8bb3db6d753b78b5b7f2b510b7
3
+ size 804672988
models/ud_augmented_jj_rb_types_20250320_v2/special_tokens_map.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "[CLS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "cls_token": {
10
+ "content": "[CLS]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "eos_token": {
17
+ "content": "[SEP]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "mask_token": {
24
+ "content": "[MASK]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "pad_token": {
31
+ "content": "[PAD]",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ },
37
+ "sep_token": {
38
+ "content": "[SEP]",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false
43
+ },
44
+ "unk_token": {
45
+ "content": "[UNK]",
46
+ "lstrip": false,
47
+ "normalized": true,
48
+ "rstrip": false,
49
+ "single_word": false
50
+ }
51
+ }
models/ud_augmented_jj_rb_types_20250320_v2/spm.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c679fbf93643d19aab7ee10c0b99e460bdbc02fedf34b92b05af343b4af586fd
3
+ size 2464616
models/ud_augmented_jj_rb_types_20250320_v2/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
models/ud_augmented_jj_rb_types_20250320_v2/tokenizer_config.json ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": true,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "[PAD]",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "1": {
13
+ "content": "[CLS]",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "2": {
21
+ "content": "[SEP]",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "3": {
29
+ "content": "[UNK]",
30
+ "lstrip": false,
31
+ "normalized": true,
32
+ "rstrip": false,
33
+ "single_word": false,
34
+ "special": true
35
+ },
36
+ "128000": {
37
+ "content": "[MASK]",
38
+ "lstrip": false,
39
+ "normalized": false,
40
+ "rstrip": false,
41
+ "single_word": false,
42
+ "special": true
43
+ }
44
+ },
45
+ "bos_token": "[CLS]",
46
+ "clean_up_tokenization_spaces": false,
47
+ "cls_token": "[CLS]",
48
+ "do_lower_case": false,
49
+ "eos_token": "[SEP]",
50
+ "extra_special_tokens": {},
51
+ "mask_token": "[MASK]",
52
+ "max_length": 512,
53
+ "model_max_length": 1000000000000000019884624838656,
54
+ "pad_to_multiple_of": null,
55
+ "pad_token": "[PAD]",
56
+ "pad_token_type_id": 0,
57
+ "padding_side": "right",
58
+ "sep_token": "[SEP]",
59
+ "sp_model_kwargs": {},
60
+ "split_by_punct": false,
61
+ "stride": 128,
62
+ "tokenizer_class": "DebertaV2Tokenizer",
63
+ "truncation_side": "right",
64
+ "truncation_strategy": "longest_first",
65
+ "unk_token": "[UNK]",
66
+ "vocab_type": "spm"
67
+ }
models/ud_augmented_jj_rb_types_20250320_v2/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:102841cc592670f6e14d8c04912a42970f142f91a5f4e56047175a6f88708035
3
+ size 5304