File size: 1,171 Bytes
8a9a2f7
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
{
  "char_to_id": {
    "[PAD]": 0,
    "[UNK]": 1,
    "[BOS]": 2,
    "[EOS]": 3,
    "[MASK]": 4,
    " ": 5,
    "ا": 6,
    "ل": 7,
    "ي": 8,
    "م": 9,
    "و": 10,
    "ن": 11,
    "ه": 12,
    "ب": 13,
    "ر": 14,
    "ع": 15,
    "ف": 16,
    "أ": 17,
    "ق": 18,
    "ت": 19,
    "د": 20,
    "ك": 21,
    "ح": 22,
    "ة": 23,
    "س": 24,
    "ج": 25,
    "إ": 26,
    "ص": 27,
    "ذ": 28,
    "ى": 29,
    "خ": 30,
    "ش": 31,
    "ث": 32,
    "ض": 33,
    "ط": 34,
    "ز": 35,
    ":": 36,
    "غ": 37,
    "ء": 38,
    "ئ": 39,
    "ظ": 40,
    "؛": 41,
    "آ": 42,
    "-": 43,
    "ؤ": 44,
    ",": 45,
    "ٰ": 46,
    "ۚ": 47,
    "ۖ": 48,
    "ۗ": 49
  },
  "vocab_size": 50,
  "special_tokens": {
    "PAD": 0,
    "UNK": 1,
    "BOS": 2,
    "EOS": 3,
    "MASK": 4,
    "SPACE": 5
  },
  "diacritic_classes": [
    "NO_DIACRITIC",
    "FATHA",
    "FATHATAN",
    "DAMMA",
    "DAMMATAN",
    "KASRA",
    "KASRATAN",
    "SUKUN",
    "SHADDA",
    "SHADDA_FATHA",
    "SHADDA_FATHATAN",
    "SHADDA_DAMMA",
    "SHADDA_DAMMATAN",
    "SHADDA_KASRA",
    "SHADDA_KASRATAN"
  ],
  "num_labels": 15
}