Zeb
committed on
Commit
·
715480f
1
Parent(s):
251f9ae
Fix normalizer
Browse files
fw57M_Surprisal_thresholdB_32000/tokenizer.json
CHANGED
|
@@ -31,7 +31,14 @@
|
|
| 31 |
"special": true
|
| 32 |
}
|
| 33 |
],
|
| 34 |
-
"normalizer":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 35 |
"pre_tokenizer": {
|
| 36 |
"type": "ByteLevel",
|
| 37 |
"add_prefix_space": true,
|
|
|
|
| 31 |
"special": true
|
| 32 |
}
|
| 33 |
],
|
| 34 |
+
"normalizer": {
|
| 35 |
+
"type": "Sequence",
|
| 36 |
+
"normalizers": [
|
| 37 |
+
{
|
| 38 |
+
"type": "NFD"
|
| 39 |
+
}
|
| 40 |
+
]
|
| 41 |
+
},
|
| 42 |
"pre_tokenizer": {
|
| 43 |
"type": "ByteLevel",
|
| 44 |
"add_prefix_space": true,
|