veryfansome committed on
Commit
b2593c3
·
verified ·
1 Parent(s): 0cdb887

Upload 8 files

Browse files
models/conll2012_en12_20250305/added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "[MASK]": 128000
3
+ }
models/conll2012_en12_20250305/config.json ADDED
@@ -0,0 +1,138 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "microsoft/deberta-v3-base",
3
+ "architectures": [
4
+ "MultiHeadModel"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "hidden_act": "gelu",
8
+ "hidden_dropout_prob": 0.1,
9
+ "hidden_size": 768,
10
+ "initializer_range": 0.02,
11
+ "intermediate_size": 3072,
12
+ "label_maps": {
13
+ "ner_tags": [
14
+ "I-DATE",
15
+ "B-ORDINAL",
16
+ "B-CARDINAL",
17
+ "O",
18
+ "B-QUANTITY",
19
+ "I-FAC",
20
+ "B-GPE",
21
+ "I-LAW",
22
+ "B-PERSON",
23
+ "B-LAW",
24
+ "B-NORP",
25
+ "B-LOC",
26
+ "I-ORDINAL",
27
+ "B-ORG",
28
+ "B-LANGUAGE",
29
+ "B-DATE",
30
+ "I-EVENT",
31
+ "I-GPE",
32
+ "I-QUANTITY",
33
+ "I-MONEY",
34
+ "I-CARDINAL",
35
+ "B-MONEY",
36
+ "I-PERCENT",
37
+ "B-TIME",
38
+ "I-WORK_OF_ART",
39
+ "I-PERSON",
40
+ "B-EVENT",
41
+ "I-NORP",
42
+ "I-LOC",
43
+ "I-PRODUCT",
44
+ "I-TIME",
45
+ "B-PRODUCT",
46
+ "B-PERCENT",
47
+ "B-WORK_OF_ART",
48
+ "I-LANGUAGE",
49
+ "I-ORG",
50
+ "B-FAC"
51
+ ],
52
+ "pos_tags": [
53
+ "WRB",
54
+ "PRP$",
55
+ "RBR",
56
+ "MD",
57
+ "PRP",
58
+ "RB",
59
+ "-LRB-",
60
+ "``",
61
+ ".",
62
+ "NN",
63
+ ":",
64
+ "VBP",
65
+ "WP$",
66
+ "*",
67
+ "VBN",
68
+ "CC",
69
+ "VBZ",
70
+ "POS",
71
+ "CD",
72
+ "NNS",
73
+ "WDT",
74
+ "LS",
75
+ "ADD",
76
+ "VERB",
77
+ "VBD",
78
+ "JJR",
79
+ "IN",
80
+ "NNPS",
81
+ "NNP",
82
+ "UH",
83
+ "RBS",
84
+ "JJ",
85
+ "FW",
86
+ "NFP",
87
+ "-RRB-",
88
+ "VBG",
89
+ "EX",
90
+ ",",
91
+ "DT",
92
+ "''",
93
+ "TO",
94
+ "SYM",
95
+ "JJS",
96
+ "RP",
97
+ "$",
98
+ "PDT",
99
+ "HYPH",
100
+ "XX",
101
+ "VB",
102
+ "WP"
103
+ ],
104
+ "verb_predicate": [
105
+ "O",
106
+ "Yes"
107
+ ]
108
+ },
109
+ "layer_norm_eps": 1e-07,
110
+ "legacy": true,
111
+ "max_position_embeddings": 512,
112
+ "max_relative_positions": -1,
113
+ "model_type": "deberta-v2",
114
+ "norm_rel_ebd": "layer_norm",
115
+ "num_attention_heads": 12,
116
+ "num_hidden_layers": 12,
117
+ "num_labels_dict": {
118
+ "ner_tags": 37,
119
+ "pos_tags": 50,
120
+ "verb_predicate": 2
121
+ },
122
+ "pad_token_id": 0,
123
+ "pooler_dropout": 0,
124
+ "pooler_hidden_act": "gelu",
125
+ "pooler_hidden_size": 768,
126
+ "pos_att_type": [
127
+ "p2c",
128
+ "c2p"
129
+ ],
130
+ "position_biased_input": false,
131
+ "position_buckets": 256,
132
+ "relative_attention": true,
133
+ "share_att_key": true,
134
+ "torch_dtype": "float32",
135
+ "transformers_version": "4.49.0",
136
+ "type_vocab_size": 0,
137
+ "vocab_size": 128100
138
+ }
models/conll2012_en12_20250305/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:250d44765f68ab176dde7a9bb06e6a52c8658c3141e25771a1a2ffdb49cdac0d
3
+ size 735624748
models/conll2012_en12_20250305/special_tokens_map.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "[CLS]",
3
+ "cls_token": "[CLS]",
4
+ "eos_token": "[SEP]",
5
+ "mask_token": "[MASK]",
6
+ "pad_token": "[PAD]",
7
+ "sep_token": "[SEP]",
8
+ "unk_token": {
9
+ "content": "[UNK]",
10
+ "lstrip": false,
11
+ "normalized": true,
12
+ "rstrip": false,
13
+ "single_word": false
14
+ }
15
+ }
models/conll2012_en12_20250305/spm.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c679fbf93643d19aab7ee10c0b99e460bdbc02fedf34b92b05af343b4af586fd
3
+ size 2464616
models/conll2012_en12_20250305/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
models/conll2012_en12_20250305/tokenizer_config.json ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": true,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "[PAD]",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "1": {
13
+ "content": "[CLS]",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "2": {
21
+ "content": "[SEP]",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "3": {
29
+ "content": "[UNK]",
30
+ "lstrip": false,
31
+ "normalized": true,
32
+ "rstrip": false,
33
+ "single_word": false,
34
+ "special": true
35
+ },
36
+ "128000": {
37
+ "content": "[MASK]",
38
+ "lstrip": false,
39
+ "normalized": false,
40
+ "rstrip": false,
41
+ "single_word": false,
42
+ "special": true
43
+ }
44
+ },
45
+ "bos_token": "[CLS]",
46
+ "clean_up_tokenization_spaces": false,
47
+ "cls_token": "[CLS]",
48
+ "do_lower_case": false,
49
+ "eos_token": "[SEP]",
50
+ "extra_special_tokens": {},
51
+ "mask_token": "[MASK]",
52
+ "model_max_length": 1000000000000000019884624838656,
53
+ "pad_token": "[PAD]",
54
+ "sep_token": "[SEP]",
55
+ "sp_model_kwargs": {},
56
+ "split_by_punct": false,
57
+ "tokenizer_class": "DebertaV2Tokenizer",
58
+ "unk_token": "[UNK]",
59
+ "vocab_type": "spm"
60
+ }
models/conll2012_en12_20250305/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:778a691f83fb5dcfe8e9c9a6371dc7f31bf3842f4d67464cc949409d466b4db0
3
+ size 5240