karmaUI committed on
Commit
5bdc99d
·
verified ·
1 Parent(s): 8e9b138

Upload Shade V7 PhoneticDeBERTa ONNX model

Browse files
Files changed (6) hide show
  1. ShadeV7.onnx +3 -0
  2. config.json +93 -0
  3. label_map.json +83 -0
  4. phonetic_config.json +25 -0
  5. tokenizer.json +0 -0
  6. tokenizer_config.json +18 -0
ShadeV7.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd0a12944f5ea4e00869dfc86f6051f00148cd3a90b8b313bebe66f5554cb7d0
3
+ size 284318923
config.json ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "PhoneticDeBERTa"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "bos_token_id": 1,
7
+ "dtype": "float32",
8
+ "eos_token_id": 2,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 384,
12
+ "id2label": {
13
+ "0": "O",
14
+ "1": "B-PERSON",
15
+ "2": "I-PERSON",
16
+ "3": "B-ORG",
17
+ "4": "I-ORG",
18
+ "5": "B-EMAIL",
19
+ "6": "I-EMAIL",
20
+ "7": "B-PHONE",
21
+ "8": "I-PHONE",
22
+ "9": "B-MONEY",
23
+ "10": "I-MONEY",
24
+ "11": "B-DATE",
25
+ "12": "I-DATE",
26
+ "13": "B-ADDRESS",
27
+ "14": "I-ADDRESS",
28
+ "15": "B-GOVID",
29
+ "16": "I-GOVID",
30
+ "17": "B-BANKACCT",
31
+ "18": "I-BANKACCT",
32
+ "19": "B-CARD",
33
+ "20": "I-CARD",
34
+ "21": "B-IPADDR",
35
+ "22": "I-IPADDR",
36
+ "23": "B-CASE",
37
+ "24": "I-CASE"
38
+ },
39
+ "initializer_range": 0.02,
40
+ "intermediate_size": 1536,
41
+ "label2id": {
42
+ "B-ADDRESS": 13,
43
+ "B-BANKACCT": 17,
44
+ "B-CARD": 19,
45
+ "B-CASE": 23,
46
+ "B-DATE": 11,
47
+ "B-EMAIL": 5,
48
+ "B-GOVID": 15,
49
+ "B-IPADDR": 21,
50
+ "B-MONEY": 9,
51
+ "B-ORG": 3,
52
+ "B-PERSON": 1,
53
+ "B-PHONE": 7,
54
+ "I-ADDRESS": 14,
55
+ "I-BANKACCT": 18,
56
+ "I-CARD": 20,
57
+ "I-CASE": 24,
58
+ "I-DATE": 12,
59
+ "I-EMAIL": 6,
60
+ "I-GOVID": 16,
61
+ "I-IPADDR": 22,
62
+ "I-MONEY": 10,
63
+ "I-ORG": 4,
64
+ "I-PERSON": 2,
65
+ "I-PHONE": 8,
66
+ "O": 0
67
+ },
68
+ "layer_norm_eps": 1e-07,
69
+ "legacy": true,
70
+ "max_position_embeddings": 512,
71
+ "max_relative_positions": -1,
72
+ "model_type": "deberta-v2",
73
+ "norm_rel_ebd": "layer_norm",
74
+ "num_attention_heads": 6,
75
+ "num_hidden_layers": 12,
76
+ "pad_token_id": 0,
77
+ "pooler_dropout": 0,
78
+ "pooler_hidden_act": "gelu",
79
+ "pooler_hidden_size": 384,
80
+ "pos_att_type": [
81
+ "p2c",
82
+ "c2p"
83
+ ],
84
+ "position_biased_input": false,
85
+ "position_buckets": 256,
86
+ "relative_attention": true,
87
+ "share_att_key": true,
88
+ "tie_word_embeddings": true,
89
+ "transformers_version": "5.1.0",
90
+ "type_vocab_size": 0,
91
+ "use_cache": false,
92
+ "vocab_size": 128100
93
+ }
label_map.json ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "labels": [
3
+ "O",
4
+ "B-PERSON",
5
+ "I-PERSON",
6
+ "B-ORG",
7
+ "I-ORG",
8
+ "B-EMAIL",
9
+ "I-EMAIL",
10
+ "B-PHONE",
11
+ "I-PHONE",
12
+ "B-MONEY",
13
+ "I-MONEY",
14
+ "B-DATE",
15
+ "I-DATE",
16
+ "B-ADDRESS",
17
+ "I-ADDRESS",
18
+ "B-GOVID",
19
+ "I-GOVID",
20
+ "B-BANKACCT",
21
+ "I-BANKACCT",
22
+ "B-CARD",
23
+ "I-CARD",
24
+ "B-IPADDR",
25
+ "I-IPADDR",
26
+ "B-CASE",
27
+ "I-CASE"
28
+ ],
29
+ "label2id": {
30
+ "O": 0,
31
+ "B-PERSON": 1,
32
+ "I-PERSON": 2,
33
+ "B-ORG": 3,
34
+ "I-ORG": 4,
35
+ "B-EMAIL": 5,
36
+ "I-EMAIL": 6,
37
+ "B-PHONE": 7,
38
+ "I-PHONE": 8,
39
+ "B-MONEY": 9,
40
+ "I-MONEY": 10,
41
+ "B-DATE": 11,
42
+ "I-DATE": 12,
43
+ "B-ADDRESS": 13,
44
+ "I-ADDRESS": 14,
45
+ "B-GOVID": 15,
46
+ "I-GOVID": 16,
47
+ "B-BANKACCT": 17,
48
+ "I-BANKACCT": 18,
49
+ "B-CARD": 19,
50
+ "I-CARD": 20,
51
+ "B-IPADDR": 21,
52
+ "I-IPADDR": 22,
53
+ "B-CASE": 23,
54
+ "I-CASE": 24
55
+ },
56
+ "id2label": {
57
+ "0": "O",
58
+ "1": "B-PERSON",
59
+ "2": "I-PERSON",
60
+ "3": "B-ORG",
61
+ "4": "I-ORG",
62
+ "5": "B-EMAIL",
63
+ "6": "I-EMAIL",
64
+ "7": "B-PHONE",
65
+ "8": "I-PHONE",
66
+ "9": "B-MONEY",
67
+ "10": "I-MONEY",
68
+ "11": "B-DATE",
69
+ "12": "I-DATE",
70
+ "13": "B-ADDRESS",
71
+ "14": "I-ADDRESS",
72
+ "15": "B-GOVID",
73
+ "16": "I-GOVID",
74
+ "17": "B-BANKACCT",
75
+ "18": "I-BANKACCT",
76
+ "19": "B-CARD",
77
+ "20": "I-CARD",
78
+ "21": "B-IPADDR",
79
+ "22": "I-IPADDR",
80
+ "23": "B-CASE",
81
+ "24": "I-CASE"
82
+ }
83
+ }
phonetic_config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "phon_chars": [
3
+ "0",
4
+ "A",
5
+ "F",
6
+ "H",
7
+ "J",
8
+ "K",
9
+ "L",
10
+ "M",
11
+ "N",
12
+ "P",
13
+ "R",
14
+ "S",
15
+ "T",
16
+ "X",
17
+ " "
18
+ ],
19
+ "phon_special": [
20
+ "[PAD]",
21
+ "[UNK]"
22
+ ],
23
+ "phon_dim": 32,
24
+ "max_phon_len": 6
25
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": true,
3
+ "backend": "tokenizers",
4
+ "bos_token": "[CLS]",
5
+ "cls_token": "[CLS]",
6
+ "do_lower_case": false,
7
+ "eos_token": "[SEP]",
8
+ "is_local": true,
9
+ "mask_token": "[MASK]",
10
+ "model_max_length": 1000000000000000019884624838656,
11
+ "pad_token": "[PAD]",
12
+ "sep_token": "[SEP]",
13
+ "split_by_punct": false,
14
+ "tokenizer_class": "DebertaV2Tokenizer",
15
+ "unk_id": 3,
16
+ "unk_token": "[UNK]",
17
+ "vocab_type": "spm"
18
+ }