dda71427
/

tokenizer.json

Model card Files Files and versions

dda71427 committed 21 days ago

Commit

34bf488

·

verified ·

1 Parent(s): d1bf205

Create . tokenizer.json

Files changed (1) hide show

. tokenizer.json +27 -0

. tokenizer.json ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "version": "1.0",
+  "truncation": null,
+  "padding": null,
+  "added_tokens": [
+    {"id": 0, "special": false, "content": "hello"},
+    {"id": 1, "special": false, "content": "world"},
+    {"id": 2, "special": true, "content": "<unk>"}
+  ],
+  "normalizer": {
+    "type": "BertNormalizer",
+    "clean_text": true,
+    "handle_chinese_chars": true,
+    "strip_accents": null,
+    "lowercase": true
+  },
+  "pre_tokenizer": {"type": "Whitespace"},
+  "model": {
+    "type": "WordLevel",
+    "vocab": {"hello": 0, "world": 1, "<unk>": 2},
+    "unk_token": "<unk>"
+  },
+  "post_processor": {
+    "type": "ByteLevel",
+    "trim_offsets": true
+  }
+}