ameforge committed on
Commit
a5c80e8
·
verified ·
1 Parent(s): 85f3fc9

Upload tokenizer_config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. tokenizer_config.json +42 -0
tokenizer_config.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "tokenizer_class": "SentencePieceProcessor",
3
+ "model_type": "bpe",
4
+ "vocab_size": 12000,
5
+ "pad_id": 0,
6
+ "bos_id": 1,
7
+ "eos_id": 2,
8
+ "unk_id": 3,
9
+ "character_coverage": 0.9999,
10
+ "byte_fallback": false,
11
+ "split_digits": false,
12
+ "normalization_rule_name": "identity",
13
+ "reserved_symbols_count": 6806,
14
+ "domains": [
15
+ "ROS",
16
+ "HTTP",
17
+ "MQTT",
18
+ "DB",
19
+ "WORKFLOW",
20
+ "ECOMMERCE",
21
+ "VEHICLE",
22
+ "HOME",
23
+ "CAL",
24
+ "FILE"
25
+ ],
26
+ "structural_tags": [
27
+ "<SCHEMA>",
28
+ "</SCHEMA>",
29
+ "<TASK>",
30
+ "</TASK>",
31
+ "<DOMAIN>",
32
+ "</DOMAIN>",
33
+ "<JSON>",
34
+ "</JSON>",
35
+ "<ACTION>",
36
+ "</ACTION>",
37
+ "<META>",
38
+ "</META>"
39
+ ],
40
+ "license": "apache-2.0",
41
+ "organization": "AMFORGE"
42
+ }