Commit ·
b10ffae
1
Parent(s): fde602a
add tokenizer
Browse files- vocab.json +1 -1
vocab.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"
|
|
|
|
| 1 |
+
{"৮": 0, "্": 1, "ফ": 2, "জ": 3, "ল": 4, "থ": 5, "৬": 6, "য": 7, "খ": 8, "উ": 9, "ূ": 10, "ং": 11, "ই": 12, "ড": 13, "প": 14, "১": 15, "ঠ": 16, "ও": 17, "গ": 18, "ী": 19, "৩": 20, "ঈ": 21, "ঝ": 22, "ৎ": 23, "ু": 24, "ৃ": 25, "ড়": 26, "এ": 27, "৯": 28, "ণ": 29, "ট": 30, "৭": 31, "ষ": 32, "ৗ": 33, "শ": 34, "দ": 35, "ত": 36, "ছ": 37, "ধ": 38, "ক": 39, "ঁ": 40, "ঋ": 41, "য়": 42, "ৰ": 43, "ব": 44, "র": 45, "ঊ": 46, "ঐ": 47, "৪": 48, "ো": 49, "ঞ": 50, "া": 51, "২": 52, "ম": 53, "আ": 54, "ঙ": 55, "ন": 56, "হ": 57, "ঢ়": 58, "ঢ": 59, "ৌ": 60, "চ": 61, "ি": 62, "ৈ": 63, "ঔ": 64, "ঘ": 65, " ": 66, "।": 67, "০": 68, "৫": 69, "স": 70, "়": 71, "ঃ": 72, "ে": 73, "অ": 74, "ভ": 75, "[UNK]": 76, "[PAD]": 77}
|