Upload tokenizer
Browse files- special_tokens_map.json +28 -4
special_tokens_map.json
CHANGED
|
@@ -103,8 +103,32 @@
|
|
| 103 |
"<unk_101>",
|
| 104 |
"<unk_102>"
|
| 105 |
],
|
| 106 |
-
"eos_token":
|
| 107 |
-
|
| 108 |
-
|
| 109 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 110 |
}
|
|
|
|
| 103 |
"<unk_101>",
|
| 104 |
"<unk_102>"
|
| 105 |
],
|
| 106 |
+
"eos_token": {
|
| 107 |
+
"content": "</s>",
|
| 108 |
+
"lstrip": false,
|
| 109 |
+
"normalized": false,
|
| 110 |
+
"rstrip": false,
|
| 111 |
+
"single_word": false
|
| 112 |
+
},
|
| 113 |
+
"mask_token": {
|
| 114 |
+
"content": "<mask_2>",
|
| 115 |
+
"lstrip": false,
|
| 116 |
+
"normalized": false,
|
| 117 |
+
"rstrip": false,
|
| 118 |
+
"single_word": false
|
| 119 |
+
},
|
| 120 |
+
"pad_token": {
|
| 121 |
+
"content": "<pad>",
|
| 122 |
+
"lstrip": false,
|
| 123 |
+
"normalized": false,
|
| 124 |
+
"rstrip": false,
|
| 125 |
+
"single_word": false
|
| 126 |
+
},
|
| 127 |
+
"unk_token": {
|
| 128 |
+
"content": "<unk>",
|
| 129 |
+
"lstrip": false,
|
| 130 |
+
"normalized": false,
|
| 131 |
+
"rstrip": false,
|
| 132 |
+
"single_word": false
|
| 133 |
+
}
|
| 134 |
}
|