FireRedTeam committed on
Commit
7029dff
·
verified ·
1 Parent(s): 89a5602

Delete chinese-lert-base-tokenizer

Browse files
chinese-lert-base-tokenizer/README.md DELETED
@@ -1,13 +0,0 @@
1
- ---
2
- language:
3
- - zh
4
- license: "apache-2.0"
5
- ---
6
- ### LERT
7
- LERT is a linguistically-motivated pre-trained language model.
8
-
9
- Further information: https://github.com/ymcui/LERT/blob/main/README_EN.md
10
-
11
- - **LERT: A Linguistically-motivated Pre-trained Language Model**
12
- - *Yiming Cui, Wanxiang Che, Shijin Wang, Ting Liu*
13
- - Paper link: https://arxiv.org/abs/2211.05344
 
 
 
 
 
 
 
 
 
 
 
 
 
 
chinese-lert-base-tokenizer/added_tokens.json DELETED
@@ -1 +0,0 @@
1
- {}
 
 
chinese-lert-base-tokenizer/config.json DELETED
@@ -1,30 +0,0 @@
1
- {
2
- "_name_or_path": ".",
3
- "architectures": [
4
- "BertForMaskedLM"
5
- ],
6
- "attention_probs_dropout_prob": 0.1,
7
- "classifier_dropout": null,
8
- "directionality": "bidi",
9
- "hidden_act": "gelu",
10
- "hidden_dropout_prob": 0.1,
11
- "hidden_size": 768,
12
- "initializer_range": 0.02,
13
- "intermediate_size": 3072,
14
- "layer_norm_eps": 1e-12,
15
- "max_position_embeddings": 512,
16
- "model_type": "bert",
17
- "num_attention_heads": 12,
18
- "num_hidden_layers": 12,
19
- "pad_token_id": 0,
20
- "pooler_fc_size": 768,
21
- "pooler_num_attention_heads": 12,
22
- "pooler_num_fc_layers": 3,
23
- "pooler_size_per_head": 128,
24
- "pooler_type": "first_token_transform",
25
- "position_embedding_type": "absolute",
26
- "transformers_version": "4.16.2",
27
- "type_vocab_size": 2,
28
- "use_cache": true,
29
- "vocab_size": 21128
30
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
chinese-lert-base-tokenizer/special_tokens_map.json DELETED
@@ -1 +0,0 @@
1
- {"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
 
 
chinese-lert-base-tokenizer/tokenizer.json DELETED
The diff for this file is too large to render. See raw diff
 
chinese-lert-base-tokenizer/tokenizer_config.json DELETED
@@ -1 +0,0 @@
1
- {"init_inputs": []}
 
 
chinese-lert-base-tokenizer/vocab.txt DELETED
The diff for this file is too large to render. See raw diff