tameto committed on
Commit
f1347ea
·
verified ·
1 Parent(s): 2856449

Initial kimetsu-style tiny GPT

Browse files
README.md ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language:
3
+ - ja
4
+ license: mit
5
+ library_name: transformers
6
+ pipeline_tag: text-generation
7
+ tags:
8
+ - tiny-gpt
9
+ - parody
10
+ - japanese
11
+ - next-token-prediction
12
+ ---
13
+
14
+ # Kimetsu-Style GPT (Tiny)
15
+
16
+ **“鬼滅風”のセリフを生成する超小型デモモデル**(教育/勉強会向け)。
17
+ このノートで、**自作コーパス → トークナイズ → 事前学習 → 生成 → 公開**までを約1時間で再現しています。
18
+
19
+ ## Training
20
+ - Tokenizer: ByteLevel BPE (target vocab ~5000; actual vocab size is 412 because the corpus is tiny)
21
+ - Model: GPT2-style decoder-only (layers=2, heads=4, d_model=256, context=128)
22
+ - Optim: AdamW, lr=0.0003, epochs=1, fp16(CUDA)
23
+ - Data: 著作権に配慮した**自作の“鬼滅風”短文**のみ
24
+
25
+ ## Intended Use & Limitations
26
+ - 教育/デモ目的。実運用・安全性は未保証です。
27
+ - 作品の公式セリフや固有名詞は含みません(**パロディ文体のみ**)。
28
+ - 生成物は確率的に不適切/不正確な内容を含む可能性があります。
config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_function": "gelu_new",
3
+ "architectures": [
4
+ "GPT2LMHeadModel"
5
+ ],
6
+ "attn_pdrop": 0.1,
7
+ "bos_token_id": 0,
8
+ "dtype": "float32",
9
+ "embd_pdrop": 0.1,
10
+ "eos_token_id": 2,
11
+ "initializer_range": 0.02,
12
+ "layer_norm_epsilon": 1e-05,
13
+ "model_type": "gpt2",
14
+ "n_ctx": 128,
15
+ "n_embd": 256,
16
+ "n_head": 4,
17
+ "n_inner": null,
18
+ "n_layer": 2,
19
+ "n_positions": 128,
20
+ "reorder_and_upcast_attn": false,
21
+ "resid_pdrop": 0.1,
22
+ "scale_attn_by_inverse_layer_idx": false,
23
+ "scale_attn_weights": true,
24
+ "summary_activation": null,
25
+ "summary_first_dropout": 0.1,
26
+ "summary_proj_to_labels": true,
27
+ "summary_type": "cls_index",
28
+ "summary_use_proj": true,
29
+ "transformers_version": "4.56.1",
30
+ "use_cache": true,
31
+ "vocab_size": 412
32
+ }
corpus_idea.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ This repo accompanies a parody-style Japanese corpus that was written only in the notebook.
2
+ No official quotes or copyrighted lines are included.
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 0,
4
+ "eos_token_id": 2,
5
+ "transformers_version": "4.56.1"
6
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0afc1c59b629af6065545d201338189d736b716f1a78d5c878209a8abad3c3f
3
+ size 6875816
special_tokens_map.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "<pad>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "unk_token": {
24
+ "content": "<unk>",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ }
30
+ }
tokenizer.json ADDED
@@ -0,0 +1,1906 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
5
+ "added_tokens": [
6
+ {
7
+ "id": 0,
8
+ "content": "<s>",
9
+ "single_word": false,
10
+ "lstrip": false,
11
+ "rstrip": false,
12
+ "normalized": false,
13
+ "special": true
14
+ },
15
+ {
16
+ "id": 1,
17
+ "content": "<pad>",
18
+ "single_word": false,
19
+ "lstrip": false,
20
+ "rstrip": false,
21
+ "normalized": false,
22
+ "special": true
23
+ },
24
+ {
25
+ "id": 2,
26
+ "content": "</s>",
27
+ "single_word": false,
28
+ "lstrip": false,
29
+ "rstrip": false,
30
+ "normalized": false,
31
+ "special": true
32
+ },
33
+ {
34
+ "id": 3,
35
+ "content": "<unk>",
36
+ "single_word": false,
37
+ "lstrip": false,
38
+ "rstrip": false,
39
+ "normalized": false,
40
+ "special": true
41
+ }
42
+ ],
43
+ "normalizer": null,
44
+ "pre_tokenizer": {
45
+ "type": "ByteLevel",
46
+ "add_prefix_space": false,
47
+ "trim_offsets": true,
48
+ "use_regex": true
49
+ },
50
+ "post_processor": {
51
+ "type": "TemplateProcessing",
52
+ "single": [
53
+ {
54
+ "SpecialToken": {
55
+ "id": "<s>",
56
+ "type_id": 0
57
+ }
58
+ },
59
+ {
60
+ "Sequence": {
61
+ "id": "A",
62
+ "type_id": 0
63
+ }
64
+ },
65
+ {
66
+ "SpecialToken": {
67
+ "id": "</s>",
68
+ "type_id": 0
69
+ }
70
+ }
71
+ ],
72
+ "pair": [
73
+ {
74
+ "SpecialToken": {
75
+ "id": "<s>",
76
+ "type_id": 0
77
+ }
78
+ },
79
+ {
80
+ "Sequence": {
81
+ "id": "A",
82
+ "type_id": 0
83
+ }
84
+ },
85
+ {
86
+ "SpecialToken": {
87
+ "id": "</s>",
88
+ "type_id": 0
89
+ }
90
+ },
91
+ {
92
+ "SpecialToken": {
93
+ "id": "<s>",
94
+ "type_id": 0
95
+ }
96
+ },
97
+ {
98
+ "Sequence": {
99
+ "id": "B",
100
+ "type_id": 0
101
+ }
102
+ },
103
+ {
104
+ "SpecialToken": {
105
+ "id": "</s>",
106
+ "type_id": 0
107
+ }
108
+ }
109
+ ],
110
+ "special_tokens": {
111
+ "</s>": {
112
+ "id": "</s>",
113
+ "ids": [
114
+ 2
115
+ ],
116
+ "tokens": [
117
+ "</s>"
118
+ ]
119
+ },
120
+ "<s>": {
121
+ "id": "<s>",
122
+ "ids": [
123
+ 0
124
+ ],
125
+ "tokens": [
126
+ "<s>"
127
+ ]
128
+ }
129
+ }
130
+ },
131
+ "decoder": null,
132
+ "model": {
133
+ "type": "BPE",
134
+ "dropout": null,
135
+ "unk_token": "<unk>",
136
+ "continuing_subword_prefix": null,
137
+ "end_of_word_suffix": null,
138
+ "fuse_unk": false,
139
+ "byte_fallback": false,
140
+ "ignore_merges": false,
141
+ "vocab": {
142
+ "<s>": 0,
143
+ "<pad>": 1,
144
+ "</s>": 2,
145
+ "<unk>": 3,
146
+ "¡": 4,
147
+ "¢": 5,
148
+ "£": 6,
149
+ "¤": 7,
150
+ "¥": 8,
151
+ "¦": 9,
152
+ "§": 10,
153
+ "¨": 11,
154
+ "ª": 12,
155
+ "«": 13,
156
+ "¬": 14,
157
+ "®": 15,
158
+ "¯": 16,
159
+ "°": 17,
160
+ "±": 18,
161
+ "²": 19,
162
+ "´": 20,
163
+ "µ": 21,
164
+ "¶": 22,
165
+ "·": 23,
166
+ "¸": 24,
167
+ "¹": 25,
168
+ "º": 26,
169
+ "»": 27,
170
+ "¼": 28,
171
+ "½": 29,
172
+ "¾": 30,
173
+ "¿": 31,
174
+ "ã": 32,
175
+ "ä": 33,
176
+ "å": 34,
177
+ "æ": 35,
178
+ "ç": 36,
179
+ "è": 37,
180
+ "é": 38,
181
+ "ï": 39,
182
+ "Ċ": 40,
183
+ "Ġ": 41,
184
+ "Ģ": 42,
185
+ "ģ": 43,
186
+ "Ĥ": 44,
187
+ "ĥ": 45,
188
+ "Ħ": 46,
189
+ "ħ": 47,
190
+ "Ĩ": 48,
191
+ "ĩ": 49,
192
+ "Ī": 50,
193
+ "ī": 51,
194
+ "Ĭ": 52,
195
+ "ĭ": 53,
196
+ "Į": 54,
197
+ "į": 55,
198
+ "İ": 56,
199
+ "ı": 57,
200
+ "IJ": 58,
201
+ "ij": 59,
202
+ "Ĵ": 60,
203
+ "ĵ": 61,
204
+ "Ķ": 62,
205
+ "ķ": 63,
206
+ "ĸ": 64,
207
+ "Ĺ": 65,
208
+ "ĺ": 66,
209
+ "Ļ": 67,
210
+ "ļ": 68,
211
+ "Ľ": 69,
212
+ "Ŀ": 70,
213
+ "ŀ": 71,
214
+ "Ł": 72,
215
+ "ł": 73,
216
+ "Ń": 74,
217
+ "ãģ": 75,
218
+ "ãĤ": 76,
219
+ "ãĥ": 77,
220
+ "Ġå": 78,
221
+ "¼ģ": 79,
222
+ "ï¼ģ": 80,
223
+ "ãĤĴ": 81,
224
+ "ãģ®": 82,
225
+ "Ġãĥ": 83,
226
+ "ãĢ": 84,
227
+ "ãĢģ": 85,
228
+ "åĪ": 86,
229
+ "ãģij": 87,
230
+ "ãĤĭ": 88,
231
+ "¤ª": 89,
232
+ "¼ãĥ": 90,
233
+ "åŀ": 91,
234
+ "ãģª": 92,
235
+ "ãĤĮ": 93,
236
+ "Ġ太": 94,
237
+ "ãĤĴç": 95,
238
+ "ãģ®åŀ": 96,
239
+ "Ġãĥİ": 97,
240
+ "Ġãĥ¼ãĥ": 98,
241
+ "åĪĢ": 99,
242
+ "Ġ太åĪĢ": 100,
243
+ "ãģ®åŀĭ": 101,
244
+ "Ġãĥ¼ãĥ¼": 102,
245
+ "Ġæ": 103,
246
+ "ãģ¯": 104,
247
+ "ãģĦ": 105,
248
+ "Ġé": 106,
249
+ "ãģł": 107,
250
+ "±ãģ": 108,
251
+ "åIJ": 109,
252
+ "æĬ": 110,
253
+ "Ġç": 111,
254
+ "Ħãģ": 112,
255
+ "ĵãģ": 113,
256
+ "Ķãģ": 114,
257
+ "ãģ¦": 115,
258
+ "ãĤģ": 116,
259
+ "ãĤĤ": 117,
260
+ "ãĤĴæ": 118,
261
+ "ãģªãģĦ": 119,
262
+ "£±": 120,
263
+ "¨ãģ": 121,
264
+ "°´": 122,
265
+ "¼åIJ": 123,
266
+ "¾ãģ": 124,
267
+ "¿ĥ": 125,
268
+ "ä»": 126,
269
+ "ä½": 127,
270
+ "å®": 128,
271
+ "åij": 129,
272
+ "è¨": 130,
273
+ "éĸ": 131,
274
+ "ĥãĤ": 132,
275
+ "ĥãģł": 133,
276
+ "ĩĥãĤ": 134,
277
+ "Ĺãģ¦": 135,
278
+ "ĺãĤĮ": 136,
279
+ "łĶãģ": 137,
280
+ "ãģ¤": 138,
281
+ "ãģ¿": 139,
282
+ "ãģĵãģ": 140,
283
+ "ãĤī": 141,
284
+ "ãĤį": 142,
285
+ "Ġå¼": 143,
286
+ "Ġ壱": 144,
287
+ "Ġå¿ĥ": 145,
288
+ "ãĤĴé": 146,
289
+ "ãģ®ãģ": 147,
290
+ "ãģ®ãģ¯": 148,
291
+ "åĪĥãģł": 149,
292
+ "ãģijãĤĭ": 150,
293
+ "ãĤĴçĩĥãĤ": 151,
294
+ "ãĤĴçłĶãģ": 152,
295
+ "Ġæ°´": 153,
296
+ "±ãģķ": 154,
297
+ "æĬĺãĤĮ": 155,
298
+ "ĦãģĽ": 156,
299
+ "¼åIJ¸": 157,
300
+ "Ġå¿ĥãĤĴçĩĥãĤ": 158,
301
+ "ãĤĴçłĶãģİ": 159,
302
+ "Ġæ°´ãģ®åŀĭ": 160,
303
+ "Ġå¿ĥãĤĴçĩĥãĤĦãģĽ": 161,
304
+ "¡åĪ": 162,
305
+ "¢¨": 163,
306
+ "£¨": 164,
307
+ "£Ĥ": 165,
308
+ "¥ãĤĮ": 166,
309
+ "¦»": 167,
310
+ "¦ļ": 168,
311
+ "¦ãģ": 169,
312
+ "¦ãĤģ": 170,
313
+ "§Ĩ": 171,
314
+ "§ãĤĤ": 172,
315
+ "¨²": 173,
316
+ "¨é": 174,
317
+ "¨ãģ¯": 175,
318
+ "«ĭ": 176,
319
+ "«åij": 177,
320
+ "«¦ãĤģ": 178,
321
+ "¬¼": 179,
322
+ "¬å": 180,
323
+ "¬æ": 181,
324
+ "¬éĸ": 182,
325
+ "±º": 183,
326
+ "±ãģ®åŀĭ": 184,
327
+ "²éĸ": 185,
328
+ "²¬å": 186,
329
+ "µĤ": 187,
330
+ "¶ļ": 188,
331
+ "·ãģ": 189,
332
+ "·ãģ®åŀĭ": 190,
333
+ "¸ı": 191,
334
+ "¸Ń": 192,
335
+ "¸ãģijãĤĭ": 193,
336
+ "¹ãģł": 194,
337
+ "º¦ãģ": 195,
338
+ "¼ãĤģ": 196,
339
+ "¼·ãģ": 197,
340
+ "½ãĤĴæ": 198,
341
+ "½±ãģ®åŀĭ": 199,
342
+ "¾Ħãģ": 200,
343
+ "¾¼ãĤģ": 201,
344
+ "¿Ĺ": 202,
345
+ "¿ãĤĭ": 203,
346
+ "ä¸Ń": 204,
347
+ "妻": 205,
348
+ "度ãģ": 206,
349
+ "å¼·ãģ": 207,
350
+ "å¿Ĺ": 208,
351
+ "æģ": 209,
352
+ "æĤ": 210,
353
+ "æĦ": 211,
354
+ "æĸ": 212,
355
+ "æ¾Ħãģ": 213,
356
+ "çŀ": 214,
357
+ "ç«ĭ": 215,
358
+ "ç¶ļ": 216,
359
+ "èĤ": 217,
360
+ "èĥ": 218,
361
+ "è£Ĥ": 219,
362
+ "è¦ļ": 220,
363
+ "諦ãĤģ": 221,
364
+ "責å": 222,
365
+ "è¸ı": 223,
366
+ "è¾¼ãĤģ": 224,
367
+ "Ġä»": 225,
368
+ "Ġãģ¿": 226,
369
+ "ĠèĤ": 227,
370
+ "ĢãĤĴç": 228,
371
+ "Ĥİ": 229,
372
+ "ĥãģ¯": 230,
373
+ "ĥãģªãģĦ": 231,
374
+ "ĥãĤĴé": 232,
375
+ "ħ¨é": 233,
376
+ "ĨĨ": 234,
377
+ "Ĩä¸Ń": 235,
378
+ "ĩį": 236,
379
+ "ĩãĤĮ": 237,
380
+ "ĩãĤĴé": 238,
381
+ "ĩ¸ãģijãĤĭ": 239,
382
+ "ĪãĤĭ": 240,
383
+ "Īĥãģ¯": 241,
384
+ "Ĭãģ": 242,
385
+ "ĭĻ": 243,
386
+ "ĭãĤī": 244,
387
+ "ĮãĤĴ": 245,
388
+ "Įå®": 246,
389
+ "İãģ¤": 247,
390
+ "ıĤ": 248,
391
+ "ıı": 249,
392
+ "ıå¿Ĺ": 250,
393
+ "ıè¸ı": 251,
394
+ "IJãĤĮ": 252,
395
+ "ijãģijãĤĭ": 253,
396
+ "ij¼åIJ¸": 254,
397
+ "ĴĥãĤĴé": 255,
398
+ "ĵãĤĴ": 256,
399
+ "ĵãģ®": 257,
400
+ "ĵãĤĴçłĶãģİ": 258,
401
+ "ķãģ": 259,
402
+ "ķ度ãģ": 260,
403
+ "ĸŃ": 261,
404
+ "ĸ¬æ": 262,
405
+ "ĹĩãĤĴé": 263,
406
+ "ĺãĤ": 264,
407
+ "Ľ·ãģ®åŀĭ": 265,
408
+ "ĽĨä¸Ń": 266,
409
+ "Ŀãģ®ãģ": 267,
410
+ "Ŀå¼·ãģ": 268,
411
+ "Łãģ®": 269,
412
+ "Ł±ãģ": 270,
413
+ "ŁãĤģ": 271,
414
+ "ŁåĪĥãģł": 272,
415
+ "Ł¥ãĤĮ": 273,
416
+ "ŃãĤį": 274,
417
+ "ãģ¾ãģ": 275,
418
+ "ãģĹãģ¦": 276,
419
+ "ãģ¡åĪ": 277,
420
+ "ãģĭãĤī": 278,
421
+ "ãģĺãĤ": 279,
422
+ "ãģĿãģ®ãģ": 280,
423
+ "ãģŃãĤį": 281,
424
+ "Ġå½±ãģ®åŀĭ": 282,
425
+ "Ġåħ¨é": 283,
426
+ "ĠåĨĨ": 284,
427
+ "ĠåĪĥãģ¯": 285,
428
+ "ĠåıĤ": 286,
429
+ "Ġåij¼åIJ¸": 287,
430
+ "ãĤĴè¨": 288,
431
+ "ãĤĴè£Ĥ": 289,
432
+ "ãģ®è²¬å": 290,
433
+ "ãģijãĤį": 291,
434
+ "ãģijãģĺãĤ": 292,
435
+ "ãĤĭãģª": 293,
436
+ "ãĤĭãģ®ãģ¯": 294,
437
+ "ãģªãĤĤ": 295,
438
+ "ãģªãĤī": 296,
439
+ "ãĤĮãģªãģĦ": 297,
440
+ "ãĤĴçŁ¥ãĤĮ": 298,
441
+ "Ġ決": 299,
442
+ "Ġæĸ¬æ": 300,
443
+ "ĠæŁ±ãģ": 301,
444
+ "ãģ¯ç¶ļ": 302,
445
+ "ãģĦãĤĭ": 303,
446
+ "ãģĦãģ¦": 304,
447
+ "Ġ風": 305,
448
+ "Ġ鬼": 306,
449
+ "ĠéĹĩãĤĴé": 307,
450
+ "Ġ鼷ãģ®åŀĭ": 308,
451
+ "ãģłãģĭãĤī": 309,
452
+ "åIJijãģijãĤĭ": 310,
453
+ "æĬĢãĤĴç": 311,
454
+ "Ġ稲": 312,
455
+ "ĠçµĤ": 313,
456
+ "ĠçĤİ": 314,
457
+ "ĵãģ«åij": 315,
458
+ "Ķãģ¨ãģ": 316,
459
+ "ãĤĤãģ¾ãģ": 317,
460
+ "ãĤĴæıı": 318,
461
+ "ãĤĴæĸŃ": 319,
462
+ "¨ãģĹãģ¦": 320,
463
+ "¾ãģĽ": 321,
464
+ "ä»Ĭãģ": 322,
465
+ "ä½ĵãĤĴçłĶãģİ": 323,
466
+ "ä½ķ度ãģ": 324,
467
+ "å®ĪãĤĭ": 325,
468
+ "åij¼åIJ¸": 326,
469
+ "許ãģķ": 327,
470
+ "ãģ¿è¾¼ãĤģ": 328,
471
+ "ãģĵãģ¨ãģ¯": 329,
472
+ "ãģĵãģĿå¼·ãģ": 330,
473
+ "Ġå¼IJ": 331,
474
+ "Ġå¼±ãģķ": 332,
475
+ "ãģ®ãģĶãģ¨ãģ": 333,
476
+ "ãģ®ãģ¯åĪĥãģł": 334,
477
+ "æĬĺãĤĮãģªãģĦ": 335,
478
+ "æĬĺãĤĮãĤĭãģ®ãģ¯": 336,
479
+ "ãĤĴçłĶãģİæ¾Ħãģ": 337,
480
+ "£¨ãģij": 338,
481
+ "§ĨãģijãĤį": 339,
482
+ "§ãĤĤç«ĭ": 340,
483
+ "¬éĸĵãģ«åij": 341,
484
+ "²éĸĵãĤĴ": 342,
485
+ "½ãĤĴæĩ¸ãģijãĤĭ": 343,
486
+ "妻ãģ®ãģĶãģ¨ãģ": 344,
487
+ "æģIJãĤĮ": 345,
488
+ "æĤŁãģ®": 346,
489
+ "æĦıå¿Ĺ": 347,
490
+ "æĸ¹ãģł": 348,
491
+ "çŀ¬éĸĵãģ«åij": 349,
492
+ "èĥĮãĤĴ": 350,
493
+ "è¦ļæĤŁãģ®": 351,
494
+ "諦ãĤģãĤĭãģª": 352,
495
+ "Ġ仲éĸĵãĤĴ": 353,
496
+ "Ġãģ¿ãģªãĤĤ": 354,
497
+ "ĠèĤĨ": 355,
498
+ "ĩįãģŃãĤį": 356,
499
+ "Į宿ãĤĭ": 357,
500
+ "İãģ¤ãģ®ãģ¯åĪĥãģł": 358,
501
+ "ıè¸ıãģ¿è¾¼ãĤģ": 359,
502
+ "ĴĥãĤĴéĩįãģŃãĤį": 360,
503
+ "ĵãģ®çŀ¬éĸĵãģ«åij": 361,
504
+ "ķãģĮ宿ãĤĭ": 362,
505
+ "ŁãĤģãģªãĤī": 363,
506
+ "ãģĹãģ¦è«¦ãĤģãĤĭãģª": 364,
507
+ "ãģ¡åĪĩãĤĮ": 365,
508
+ "ãģĿãģ®ãģŁãĤģãģªãĤī": 366,
509
+ "Ġåħ¨éĽĨä¸Ń": 367,
510
+ "ĠåĨĨãĤĴæıı": 368,
511
+ "ĠåĪĥãģ¯æĬĺãĤĮãģªãģĦ": 369,
512
+ "Ġåij¼åIJ¸ãĤĴçłĶãģİæ¾Ħãģ": 370,
513
+ "ãĤĴè¨İãģ¤ãģ®ãģ¯åĪĥãģł": 371,
514
+ "ãĤĴè£Ĥãģij": 372,
515
+ "ãģ®è²¬åĭĻ": 373,
516
+ "ãģijãģĺãĤĥãģªãģĦ": 374,
517
+ "Ġ決ãģĹãģ¦è«¦ãĤģãĤĭãģª": 375,
518
+ "Ġæĸ¬æĴĥãĤĴéĩįãģŃãĤį": 376,
519
+ "ĠæŁ±ãģ¨ãģĹãģ¦": 377,
520
+ "ãģ¯ç¶ļãģĦãģ¦": 378,
521
+ "Ġ風ãģ®åŀĭ": 379,
522
+ "Ġ鬼ãĤĴè¨İãģ¤ãģ®ãģ¯åĪĥãģł": 380,
523
+ "ĠéĹĩãĤĴé§ĨãģijãĤį": 381,
524
+ "ãģłãģĭãĤīãģĵãģĿå¼·ãģ": 382,
525
+ "åIJijãģijãĤĭãģĵãģ¨ãģ¯": 383,
526
+ "æĬĢãĤĴ磨ãģij": 384,
527
+ "Ġ稲妻ãģ®ãģĶãģ¨ãģ": 385,
528
+ "ĠçĤİãģ®åŀĭ": 386,
529
+ "ãĤĤãģ¾ãģŁåĪĥãģł": 387,
530
+ "ãĤĴæĸŃãģ¡åĪĩãĤĮ": 388,
531
+ "ä»Ĭãģĵãģ®çŀ¬éĸĵãģ«åij": 389,
532
+ "ä½ķ度ãģ§ãĤĤç«ĭ": 390,
533
+ "åij¼åIJ¸ãģ¯ç¶ļãģĦãģ¦": 391,
534
+ "許ãģķãĤĮãģªãģĦ": 392,
535
+ "Ġå¼±ãģķãĤĴçŁ¥ãĤĮ": 393,
536
+ "æĬĺãĤĮãĤĭãģ®ãģ¯è¦ļæĤŁãģ®": 394,
537
+ "æģIJãĤĮãĤĴæĸŃãģ¡åĪĩãĤĮ": 395,
538
+ "æĦıå¿ĹãĤĤãģ¾ãģŁåĪĥãģł": 396,
539
+ "èĥĮãĤĴåIJijãģijãĤĭãģĵãģ¨ãģ¯": 397,
540
+ "Ġ仲éĸĵãĤĴå®ĪãĤĭ": 398,
541
+ "Ġãģ¿ãģªãĤĤãĤĴè£Ĥãģij": 399,
542
+ "ãģĿãģ®ãģŁãĤģãģªãĤīä½ķ度ãģ§ãĤĤç«ĭ": 400,
543
+ "ĠåĨĨãĤĴæııãģij": 401,
544
+ "Ġåij¼åIJ¸ãĤĴçłĶãģİæ¾Ħãģ¾ãģĽ": 402,
545
+ "ĠæŁ±ãģ¨ãģĹãģ¦ãģ®è²¬åĭĻ": 403,
546
+ "Ġ鬼ãĤĴè¨İãģ¤ãģ®ãģ¯åĪĥãģłãģijãģĺãĤĥãģªãģĦ": 404,
547
+ "ãģłãģĭãĤīãģĵãģĿå¼·ãģķãģĮ宿ãĤĭ": 405,
548
+ "Ġ稲妻ãģ®ãģĶãģ¨ãģıè¸ıãģ¿è¾¼ãĤģ": 406,
549
+ "ä»Ĭãģĵãģ®çŀ¬éĸĵãģ«åij½ãĤĴæĩ¸ãģijãĤĭ": 407,
550
+ "åij¼åIJ¸ãģ¯ç¶ļãģĦãģ¦ãģĦãĤĭ": 408,
551
+ "æĬĺãĤĮãĤĭãģ®ãģ¯è¦ļæĤŁãģ®æĸ¹ãģł": 409,
552
+ "èĥĮãĤĴåIJijãģijãĤĭãģĵãģ¨ãģ¯è¨±ãģķãĤĮãģªãģĦ": 410,
553
+ "ãģĿãģ®ãģŁãĤģãģªãĤīä½ķ度ãģ§ãĤĤç«ĭãģ¤": 411
554
+ },
555
+ "merges": [
556
+ [
557
+ "ã",
558
+ "ģ"
559
+ ],
560
+ [
561
+ "ã",
562
+ "Ĥ"
563
+ ],
564
+ [
565
+ "ã",
566
+ "ĥ"
567
+ ],
568
+ [
569
+ "Ġ",
570
+ "å"
571
+ ],
572
+ [
573
+ "¼",
574
+ "ģ"
575
+ ],
576
+ [
577
+ "ï",
578
+ "¼ģ"
579
+ ],
580
+ [
581
+ "ãĤ",
582
+ "Ĵ"
583
+ ],
584
+ [
585
+ "ãģ",
586
+ "®"
587
+ ],
588
+ [
589
+ "Ġ",
590
+ "ãĥ"
591
+ ],
592
+ [
593
+ "ã",
594
+ "Ģ"
595
+ ],
596
+ [
597
+ "ãĢ",
598
+ "ģ"
599
+ ],
600
+ [
601
+ "å",
602
+ "Ī"
603
+ ],
604
+ [
605
+ "ãģ",
606
+ "ij"
607
+ ],
608
+ [
609
+ "ãĤ",
610
+ "ĭ"
611
+ ],
612
+ [
613
+ "¤",
614
+ "ª"
615
+ ],
616
+ [
617
+ "¼",
618
+ "ãĥ"
619
+ ],
620
+ [
621
+ "å",
622
+ "ŀ"
623
+ ],
624
+ [
625
+ "ãģ",
626
+ "ª"
627
+ ],
628
+ [
629
+ "ãĤ",
630
+ "Į"
631
+ ],
632
+ [
633
+ "Ġå",
634
+ "¤ª"
635
+ ],
636
+ [
637
+ "ãĤĴ",
638
+ "ç"
639
+ ],
640
+ [
641
+ "ãģ®",
642
+ "åŀ"
643
+ ],
644
+ [
645
+ "Ġãĥ",
646
+ "İ"
647
+ ],
648
+ [
649
+ "Ġãĥ",
650
+ "¼ãĥ"
651
+ ],
652
+ [
653
+ "åĪ",
654
+ "Ģ"
655
+ ],
656
+ [
657
+ "Ġ太",
658
+ "åĪĢ"
659
+ ],
660
+ [
661
+ "ãģ®åŀ",
662
+ "ĭ"
663
+ ],
664
+ [
665
+ "Ġãĥ¼ãĥ",
666
+ "¼"
667
+ ],
668
+ [
669
+ "Ġ",
670
+ "æ"
671
+ ],
672
+ [
673
+ "ãģ",
674
+ "¯"
675
+ ],
676
+ [
677
+ "ãģ",
678
+ "Ħ"
679
+ ],
680
+ [
681
+ "Ġ",
682
+ "é"
683
+ ],
684
+ [
685
+ "ãģ",
686
+ "ł"
687
+ ],
688
+ [
689
+ "±",
690
+ "ãģ"
691
+ ],
692
+ [
693
+ "å",
694
+ "IJ"
695
+ ],
696
+ [
697
+ "æ",
698
+ "Ĭ"
699
+ ],
700
+ [
701
+ "Ġ",
702
+ "ç"
703
+ ],
704
+ [
705
+ "Ħ",
706
+ "ãģ"
707
+ ],
708
+ [
709
+ "ĵ",
710
+ "ãģ"
711
+ ],
712
+ [
713
+ "Ķ",
714
+ "ãģ"
715
+ ],
716
+ [
717
+ "ãģ",
718
+ "¦"
719
+ ],
720
+ [
721
+ "ãĤ",
722
+ "ģ"
723
+ ],
724
+ [
725
+ "ãĤ",
726
+ "Ĥ"
727
+ ],
728
+ [
729
+ "ãĤĴ",
730
+ "æ"
731
+ ],
732
+ [
733
+ "ãģª",
734
+ "ãģĦ"
735
+ ],
736
+ [
737
+ "£",
738
+ "±"
739
+ ],
740
+ [
741
+ "¨",
742
+ "ãģ"
743
+ ],
744
+ [
745
+ "°",
746
+ "´"
747
+ ],
748
+ [
749
+ "¼",
750
+ "åIJ"
751
+ ],
752
+ [
753
+ "¾",
754
+ "ãģ"
755
+ ],
756
+ [
757
+ "¿",
758
+ "ĥ"
759
+ ],
760
+ [
761
+ "ä",
762
+ "»"
763
+ ],
764
+ [
765
+ "ä",
766
+ "½"
767
+ ],
768
+ [
769
+ "å",
770
+ "®"
771
+ ],
772
+ [
773
+ "å",
774
+ "ij"
775
+ ],
776
+ [
777
+ "è",
778
+ "¨"
779
+ ],
780
+ [
781
+ "é",
782
+ "ĸ"
783
+ ],
784
+ [
785
+ "ĥ",
786
+ "ãĤ"
787
+ ],
788
+ [
789
+ "ĥ",
790
+ "ãģł"
791
+ ],
792
+ [
793
+ "ĩ",
794
+ "ĥãĤ"
795
+ ],
796
+ [
797
+ "Ĺ",
798
+ "ãģ¦"
799
+ ],
800
+ [
801
+ "ĺ",
802
+ "ãĤĮ"
803
+ ],
804
+ [
805
+ "ł",
806
+ "Ķãģ"
807
+ ],
808
+ [
809
+ "ãģ",
810
+ "¤"
811
+ ],
812
+ [
813
+ "ãģ",
814
+ "¿"
815
+ ],
816
+ [
817
+ "ãģ",
818
+ "ĵãģ"
819
+ ],
820
+ [
821
+ "ãĤ",
822
+ "ī"
823
+ ],
824
+ [
825
+ "ãĤ",
826
+ "į"
827
+ ],
828
+ [
829
+ "Ġå",
830
+ "¼"
831
+ ],
832
+ [
833
+ "Ġå",
834
+ "£±"
835
+ ],
836
+ [
837
+ "Ġå",
838
+ "¿ĥ"
839
+ ],
840
+ [
841
+ "ãĤĴ",
842
+ "é"
843
+ ],
844
+ [
845
+ "ãģ®",
846
+ "ãģ"
847
+ ],
848
+ [
849
+ "ãģ®",
850
+ "ãģ¯"
851
+ ],
852
+ [
853
+ "åĪ",
854
+ "ĥãģł"
855
+ ],
856
+ [
857
+ "ãģij",
858
+ "ãĤĭ"
859
+ ],
860
+ [
861
+ "ãĤĴç",
862
+ "ĩĥãĤ"
863
+ ],
864
+ [
865
+ "ãĤĴç",
866
+ "łĶãģ"
867
+ ],
868
+ [
869
+ "Ġæ",
870
+ "°´"
871
+ ],
872
+ [
873
+ "±ãģ",
874
+ "ķ"
875
+ ],
876
+ [
877
+ "æĬ",
878
+ "ĺãĤĮ"
879
+ ],
880
+ [
881
+ "Ħãģ",
882
+ "Ľ"
883
+ ],
884
+ [
885
+ "¼åIJ",
886
+ "¸"
887
+ ],
888
+ [
889
+ "Ġå¿ĥ",
890
+ "ãĤĴçĩĥãĤ"
891
+ ],
892
+ [
893
+ "ãĤĴçłĶãģ",
894
+ "İ"
895
+ ],
896
+ [
897
+ "Ġæ°´",
898
+ "ãģ®åŀĭ"
899
+ ],
900
+ [
901
+ "Ġå¿ĥãĤĴçĩĥãĤ",
902
+ "ĦãģĽ"
903
+ ],
904
+ [
905
+ "¡",
906
+ "åĪ"
907
+ ],
908
+ [
909
+ "¢",
910
+ "¨"
911
+ ],
912
+ [
913
+ "£",
914
+ "¨"
915
+ ],
916
+ [
917
+ "£",
918
+ "Ĥ"
919
+ ],
920
+ [
921
+ "¥",
922
+ "ãĤĮ"
923
+ ],
924
+ [
925
+ "¦",
926
+ "»"
927
+ ],
928
+ [
929
+ "¦",
930
+ "ļ"
931
+ ],
932
+ [
933
+ "¦",
934
+ "ãģ"
935
+ ],
936
+ [
937
+ "¦",
938
+ "ãĤģ"
939
+ ],
940
+ [
941
+ "§",
942
+ "Ĩ"
943
+ ],
944
+ [
945
+ "§",
946
+ "ãĤĤ"
947
+ ],
948
+ [
949
+ "¨",
950
+ "²"
951
+ ],
952
+ [
953
+ "¨",
954
+ "é"
955
+ ],
956
+ [
957
+ "¨",
958
+ "ãģ¯"
959
+ ],
960
+ [
961
+ "«",
962
+ "ĭ"
963
+ ],
964
+ [
965
+ "«",
966
+ "åij"
967
+ ],
968
+ [
969
+ "«",
970
+ "¦ãĤģ"
971
+ ],
972
+ [
973
+ "¬",
974
+ "¼"
975
+ ],
976
+ [
977
+ "¬",
978
+ "å"
979
+ ],
980
+ [
981
+ "¬",
982
+ "æ"
983
+ ],
984
+ [
985
+ "¬",
986
+ "éĸ"
987
+ ],
988
+ [
989
+ "±",
990
+ "º"
991
+ ],
992
+ [
993
+ "±",
994
+ "ãģ®åŀĭ"
995
+ ],
996
+ [
997
+ "²",
998
+ "éĸ"
999
+ ],
1000
+ [
1001
+ "²",
1002
+ "¬å"
1003
+ ],
1004
+ [
1005
+ "µ",
1006
+ "Ĥ"
1007
+ ],
1008
+ [
1009
+ "¶",
1010
+ "ļ"
1011
+ ],
1012
+ [
1013
+ "·",
1014
+ "ãģ"
1015
+ ],
1016
+ [
1017
+ "·",
1018
+ "ãģ®åŀĭ"
1019
+ ],
1020
+ [
1021
+ "¸",
1022
+ "ı"
1023
+ ],
1024
+ [
1025
+ "¸",
1026
+ "Ń"
1027
+ ],
1028
+ [
1029
+ "¸",
1030
+ "ãģijãĤĭ"
1031
+ ],
1032
+ [
1033
+ "¹",
1034
+ "ãģł"
1035
+ ],
1036
+ [
1037
+ "º",
1038
+ "¦ãģ"
1039
+ ],
1040
+ [
1041
+ "¼",
1042
+ "ãĤģ"
1043
+ ],
1044
+ [
1045
+ "¼",
1046
+ "·ãģ"
1047
+ ],
1048
+ [
1049
+ "½",
1050
+ "ãĤĴæ"
1051
+ ],
1052
+ [
1053
+ "½",
1054
+ "±ãģ®åŀĭ"
1055
+ ],
1056
+ [
1057
+ "¾",
1058
+ "Ħãģ"
1059
+ ],
1060
+ [
1061
+ "¾",
1062
+ "¼ãĤģ"
1063
+ ],
1064
+ [
1065
+ "¿",
1066
+ "Ĺ"
1067
+ ],
1068
+ [
1069
+ "¿",
1070
+ "ãĤĭ"
1071
+ ],
1072
+ [
1073
+ "ä",
1074
+ "¸Ń"
1075
+ ],
1076
+ [
1077
+ "å",
1078
+ "¦»"
1079
+ ],
1080
+ [
1081
+ "å",
1082
+ "º¦ãģ"
1083
+ ],
1084
+ [
1085
+ "å",
1086
+ "¼·ãģ"
1087
+ ],
1088
+ [
1089
+ "å",
1090
+ "¿Ĺ"
1091
+ ],
1092
+ [
1093
+ "æ",
1094
+ "ģ"
1095
+ ],
1096
+ [
1097
+ "æ",
1098
+ "Ĥ"
1099
+ ],
1100
+ [
1101
+ "æ",
1102
+ "Ħ"
1103
+ ],
1104
+ [
1105
+ "æ",
1106
+ "ĸ"
1107
+ ],
1108
+ [
1109
+ "æ",
1110
+ "¾Ħãģ"
1111
+ ],
1112
+ [
1113
+ "ç",
1114
+ "ŀ"
1115
+ ],
1116
+ [
1117
+ "ç",
1118
+ "«ĭ"
1119
+ ],
1120
+ [
1121
+ "ç",
1122
+ "¶ļ"
1123
+ ],
1124
+ [
1125
+ "è",
1126
+ "Ĥ"
1127
+ ],
1128
+ [
1129
+ "è",
1130
+ "ĥ"
1131
+ ],
1132
+ [
1133
+ "è",
1134
+ "£Ĥ"
1135
+ ],
1136
+ [
1137
+ "è",
1138
+ "¦ļ"
1139
+ ],
1140
+ [
1141
+ "è",
1142
+ "«¦ãĤģ"
1143
+ ],
1144
+ [
1145
+ "è",
1146
+ "²¬å"
1147
+ ],
1148
+ [
1149
+ "è",
1150
+ "¸ı"
1151
+ ],
1152
+ [
1153
+ "è",
1154
+ "¾¼ãĤģ"
1155
+ ],
1156
+ [
1157
+ "Ġ",
1158
+ "ä»"
1159
+ ],
1160
+ [
1161
+ "Ġ",
1162
+ "ãģ¿"
1163
+ ],
1164
+ [
1165
+ "Ġ",
1166
+ "èĤ"
1167
+ ],
1168
+ [
1169
+ "Ģ",
1170
+ "ãĤĴç"
1171
+ ],
1172
+ [
1173
+ "Ĥ",
1174
+ "İ"
1175
+ ],
1176
+ [
1177
+ "ĥ",
1178
+ "ãģ¯"
1179
+ ],
1180
+ [
1181
+ "ĥ",
1182
+ "ãģªãģĦ"
1183
+ ],
1184
+ [
1185
+ "ĥ",
1186
+ "ãĤĴé"
1187
+ ],
1188
+ [
1189
+ "ħ",
1190
+ "¨é"
1191
+ ],
1192
+ [
1193
+ "Ĩ",
1194
+ "Ĩ"
1195
+ ],
1196
+ [
1197
+ "Ĩ",
1198
+ "ä¸Ń"
1199
+ ],
1200
+ [
1201
+ "ĩ",
1202
+ "į"
1203
+ ],
1204
+ [
1205
+ "ĩ",
1206
+ "ãĤĮ"
1207
+ ],
1208
+ [
1209
+ "ĩ",
1210
+ "ãĤĴé"
1211
+ ],
1212
+ [
1213
+ "ĩ",
1214
+ "¸ãģijãĤĭ"
1215
+ ],
1216
+ [
1217
+ "Ī",
1218
+ "ãĤĭ"
1219
+ ],
1220
+ [
1221
+ "Ī",
1222
+ "ĥãģ¯"
1223
+ ],
1224
+ [
1225
+ "Ĭ",
1226
+ "ãģ"
1227
+ ],
1228
+ [
1229
+ "ĭ",
1230
+ "Ļ"
1231
+ ],
1232
+ [
1233
+ "ĭ",
1234
+ "ãĤī"
1235
+ ],
1236
+ [
1237
+ "Į",
1238
+ "ãĤĴ"
1239
+ ],
1240
+ [
1241
+ "Į",
1242
+ "å®"
1243
+ ],
1244
+ [
1245
+ "İ",
1246
+ "ãģ¤"
1247
+ ],
1248
+ [
1249
+ "ı",
1250
+ "Ĥ"
1251
+ ],
1252
+ [
1253
+ "ı",
1254
+ "ı"
1255
+ ],
1256
+ [
1257
+ "ı",
1258
+ "å¿Ĺ"
1259
+ ],
1260
+ [
1261
+ "ı",
1262
+ "è¸ı"
1263
+ ],
1264
+ [
1265
+ "IJ",
1266
+ "ãĤĮ"
1267
+ ],
1268
+ [
1269
+ "ij",
1270
+ "ãģijãĤĭ"
1271
+ ],
1272
+ [
1273
+ "ij",
1274
+ "¼åIJ¸"
1275
+ ],
1276
+ [
1277
+ "Ĵ",
1278
+ "ĥãĤĴé"
1279
+ ],
1280
+ [
1281
+ "ĵ",
1282
+ "ãĤĴ"
1283
+ ],
1284
+ [
1285
+ "ĵ",
1286
+ "ãģ®"
1287
+ ],
1288
+ [
1289
+ "ĵ",
1290
+ "ãĤĴçłĶãģİ"
1291
+ ],
1292
+ [
1293
+ "ķ",
1294
+ "ãģ"
1295
+ ],
1296
+ [
1297
+ "ķ",
1298
+ "度ãģ"
1299
+ ],
1300
+ [
1301
+ "ĸ",
1302
+ "Ń"
1303
+ ],
1304
+ [
1305
+ "ĸ",
1306
+ "¬æ"
1307
+ ],
1308
+ [
1309
+ "Ĺ",
1310
+ "ĩãĤĴé"
1311
+ ],
1312
+ [
1313
+ "ĺ",
1314
+ "ãĤ"
1315
+ ],
1316
+ [
1317
+ "Ľ",
1318
+ "·ãģ®åŀĭ"
1319
+ ],
1320
+ [
1321
+ "Ľ",
1322
+ "Ĩä¸Ń"
1323
+ ],
1324
+ [
1325
+ "Ŀ",
1326
+ "ãģ®ãģ"
1327
+ ],
1328
+ [
1329
+ "Ŀ",
1330
+ "å¼·ãģ"
1331
+ ],
1332
+ [
1333
+ "Ł",
1334
+ "ãģ®"
1335
+ ],
1336
+ [
1337
+ "Ł",
1338
+ "±ãģ"
1339
+ ],
1340
+ [
1341
+ "Ł",
1342
+ "ãĤģ"
1343
+ ],
1344
+ [
1345
+ "Ł",
1346
+ "åĪĥãģł"
1347
+ ],
1348
+ [
1349
+ "Ł",
1350
+ "¥ãĤĮ"
1351
+ ],
1352
+ [
1353
+ "Ń",
1354
+ "ãĤį"
1355
+ ],
1356
+ [
1357
+ "ãģ",
1358
+ "¾ãģ"
1359
+ ],
1360
+ [
1361
+ "ãģ",
1362
+ "Ĺãģ¦"
1363
+ ],
1364
+ [
1365
+ "ãģ",
1366
+ "¡åĪ"
1367
+ ],
1368
+ [
1369
+ "ãģ",
1370
+ "ĭãĤī"
1371
+ ],
1372
+ [
1373
+ "ãģ",
1374
+ "ĺãĤ"
1375
+ ],
1376
+ [
1377
+ "ãģ",
1378
+ "Ŀãģ®ãģ"
1379
+ ],
1380
+ [
1381
+ "ãģ",
1382
+ "ŃãĤį"
1383
+ ],
1384
+ [
1385
+ "Ġå",
1386
+ "½±ãģ®åŀĭ"
1387
+ ],
1388
+ [
1389
+ "Ġå",
1390
+ "ħ¨é"
1391
+ ],
1392
+ [
1393
+ "Ġå",
1394
+ "ĨĨ"
1395
+ ],
1396
+ [
1397
+ "Ġå",
1398
+ "Īĥãģ¯"
1399
+ ],
1400
+ [
1401
+ "Ġå",
1402
+ "ıĤ"
1403
+ ],
1404
+ [
1405
+ "Ġå",
1406
+ "ij¼åIJ¸"
1407
+ ],
1408
+ [
1409
+ "ãĤĴ",
1410
+ "è¨"
1411
+ ],
1412
+ [
1413
+ "ãĤĴ",
1414
+ "è£Ĥ"
1415
+ ],
1416
+ [
1417
+ "ãģ®",
1418
+ "責å"
1419
+ ],
1420
+ [
1421
+ "ãģij",
1422
+ "ãĤį"
1423
+ ],
1424
+ [
1425
+ "ãģij",
1426
+ "ãģĺãĤ"
1427
+ ],
1428
+ [
1429
+ "ãĤĭ",
1430
+ "ãģª"
1431
+ ],
1432
+ [
1433
+ "ãĤĭ",
1434
+ "ãģ®ãģ¯"
1435
+ ],
1436
+ [
1437
+ "ãģª",
1438
+ "ãĤĤ"
1439
+ ],
1440
+ [
1441
+ "ãģª",
1442
+ "ãĤī"
1443
+ ],
1444
+ [
1445
+ "ãĤĮ",
1446
+ "ãģªãģĦ"
1447
+ ],
1448
+ [
1449
+ "ãĤĴç",
1450
+ "Ł¥ãĤĮ"
1451
+ ],
1452
+ [
1453
+ "Ġæ",
1454
+ "±º"
1455
+ ],
1456
+ [
1457
+ "Ġæ",
1458
+ "ĸ¬æ"
1459
+ ],
1460
+ [
1461
+ "Ġæ",
1462
+ "Ł±ãģ"
1463
+ ],
1464
+ [
1465
+ "ãģ¯",
1466
+ "ç¶ļ"
1467
+ ],
1468
+ [
1469
+ "ãģĦ",
1470
+ "ãĤĭ"
1471
+ ],
1472
+ [
1473
+ "ãģĦ",
1474
+ "ãģ¦"
1475
+ ],
1476
+ [
1477
+ "Ġé",
1478
+ "¢¨"
1479
+ ],
1480
+ [
1481
+ "Ġé",
1482
+ "¬¼"
1483
+ ],
1484
+ [
1485
+ "Ġé",
1486
+ "ĹĩãĤĴé"
1487
+ ],
1488
+ [
1489
+ "Ġé",
1490
+ "Ľ·ãģ®åŀĭ"
1491
+ ],
1492
+ [
1493
+ "ãģł",
1494
+ "ãģĭãĤī"
1495
+ ],
1496
+ [
1497
+ "åIJ",
1498
+ "ijãģijãĤĭ"
1499
+ ],
1500
+ [
1501
+ "æĬ",
1502
+ "ĢãĤĴç"
1503
+ ],
1504
+ [
1505
+ "Ġç",
1506
+ "¨²"
1507
+ ],
1508
+ [
1509
+ "Ġç",
1510
+ "µĤ"
1511
+ ],
1512
+ [
1513
+ "Ġç",
1514
+ "Ĥİ"
1515
+ ],
1516
+ [
1517
+ "ĵãģ",
1518
+ "«åij"
1519
+ ],
1520
+ [
1521
+ "Ķãģ",
1522
+ "¨ãģ"
1523
+ ],
1524
+ [
1525
+ "ãĤĤ",
1526
+ "ãģ¾ãģ"
1527
+ ],
1528
+ [
1529
+ "ãĤĴæ",
1530
+ "ıı"
1531
+ ],
1532
+ [
1533
+ "ãĤĴæ",
1534
+ "ĸŃ"
1535
+ ],
1536
+ [
1537
+ "¨ãģ",
1538
+ "Ĺãģ¦"
1539
+ ],
1540
+ [
1541
+ "¾ãģ",
1542
+ "Ľ"
1543
+ ],
1544
+ [
1545
+ "ä»",
1546
+ "Ĭãģ"
1547
+ ],
1548
+ [
1549
+ "ä½",
1550
+ "ĵãĤĴçłĶãģİ"
1551
+ ],
1552
+ [
1553
+ "ä½",
1554
+ "ķ度ãģ"
1555
+ ],
1556
+ [
1557
+ "å®",
1558
+ "ĪãĤĭ"
1559
+ ],
1560
+ [
1561
+ "åij",
1562
+ "¼åIJ¸"
1563
+ ],
1564
+ [
1565
+ "è¨",
1566
+ "±ãģķ"
1567
+ ],
1568
+ [
1569
+ "ãģ¿",
1570
+ "è¾¼ãĤģ"
1571
+ ],
1572
+ [
1573
+ "ãģĵãģ",
1574
+ "¨ãģ¯"
1575
+ ],
1576
+ [
1577
+ "ãģĵãģ",
1578
+ "Ŀå¼·ãģ"
1579
+ ],
1580
+ [
1581
+ "Ġå¼",
1582
+ "IJ"
1583
+ ],
1584
+ [
1585
+ "Ġå¼",
1586
+ "±ãģķ"
1587
+ ],
1588
+ [
1589
+ "ãģ®ãģ",
1590
+ "Ķãģ¨ãģ"
1591
+ ],
1592
+ [
1593
+ "ãģ®ãģ¯",
1594
+ "åĪĥãģł"
1595
+ ],
1596
+ [
1597
+ "æĬĺãĤĮ",
1598
+ "ãģªãģĦ"
1599
+ ],
1600
+ [
1601
+ "æĬĺãĤĮ",
1602
+ "ãĤĭãģ®ãģ¯"
1603
+ ],
1604
+ [
1605
+ "ãĤĴçłĶãģİ",
1606
+ "æ¾Ħãģ"
1607
+ ],
1608
+ [
1609
+ "£¨",
1610
+ "ãģij"
1611
+ ],
1612
+ [
1613
+ "§Ĩ",
1614
+ "ãģijãĤį"
1615
+ ],
1616
+ [
1617
+ "§ãĤĤ",
1618
+ "ç«ĭ"
1619
+ ],
1620
+ [
1621
+ "¬éĸ",
1622
+ "ĵãģ«åij"
1623
+ ],
1624
+ [
1625
+ "²éĸ",
1626
+ "ĵãĤĴ"
1627
+ ],
1628
+ [
1629
+ "½ãĤĴæ",
1630
+ "ĩ¸ãģijãĤĭ"
1631
+ ],
1632
+ [
1633
+ "妻",
1634
+ "ãģ®ãģĶãģ¨ãģ"
1635
+ ],
1636
+ [
1637
+ "æģ",
1638
+ "IJãĤĮ"
1639
+ ],
1640
+ [
1641
+ "æĤ",
1642
+ "Łãģ®"
1643
+ ],
1644
+ [
1645
+ "æĦ",
1646
+ "ıå¿Ĺ"
1647
+ ],
1648
+ [
1649
+ "æĸ",
1650
+ "¹ãģł"
1651
+ ],
1652
+ [
1653
+ "çŀ",
1654
+ "¬éĸĵãģ«åij"
1655
+ ],
1656
+ [
1657
+ "èĥ",
1658
+ "ĮãĤĴ"
1659
+ ],
1660
+ [
1661
+ "è¦ļ",
1662
+ "æĤŁãģ®"
1663
+ ],
1664
+ [
1665
+ "諦ãĤģ",
1666
+ "ãĤĭãģª"
1667
+ ],
1668
+ [
1669
+ "Ġä»",
1670
+ "²éĸĵãĤĴ"
1671
+ ],
1672
+ [
1673
+ "Ġãģ¿",
1674
+ "ãģªãĤĤ"
1675
+ ],
1676
+ [
1677
+ "ĠèĤ",
1678
+ "Ĩ"
1679
+ ],
1680
+ [
1681
+ "ĩį",
1682
+ "ãģŃãĤį"
1683
+ ],
1684
+ [
1685
+ "Įå®",
1686
+ "¿ãĤĭ"
1687
+ ],
1688
+ [
1689
+ "İãģ¤",
1690
+ "ãģ®ãģ¯åĪĥãģł"
1691
+ ],
1692
+ [
1693
+ "ıè¸ı",
1694
+ "ãģ¿è¾¼ãĤģ"
1695
+ ],
1696
+ [
1697
+ "ĴĥãĤĴé",
1698
+ "ĩįãģŃãĤį"
1699
+ ],
1700
+ [
1701
+ "ĵãģ®",
1702
+ "çŀ¬éĸĵãģ«åij"
1703
+ ],
1704
+ [
1705
+ "ķãģ",
1706
+ "Į宿ãĤĭ"
1707
+ ],
1708
+ [
1709
+ "ŁãĤģ",
1710
+ "ãģªãĤī"
1711
+ ],
1712
+ [
1713
+ "ãģĹãģ¦",
1714
+ "諦ãĤģãĤĭãģª"
1715
+ ],
1716
+ [
1717
+ "ãģ¡åĪ",
1718
+ "ĩãĤĮ"
1719
+ ],
1720
+ [
1721
+ "ãģĿãģ®ãģ",
1722
+ "ŁãĤģãģªãĤī"
1723
+ ],
1724
+ [
1725
+ "Ġåħ¨é",
1726
+ "ĽĨä¸Ń"
1727
+ ],
1728
+ [
1729
+ "ĠåĨĨ",
1730
+ "ãĤĴæıı"
1731
+ ],
1732
+ [
1733
+ "ĠåĪĥãģ¯",
1734
+ "æĬĺãĤĮãģªãģĦ"
1735
+ ],
1736
+ [
1737
+ "Ġåij¼åIJ¸",
1738
+ "ãĤĴçłĶãģİæ¾Ħãģ"
1739
+ ],
1740
+ [
1741
+ "ãĤĴè¨",
1742
+ "İãģ¤ãģ®ãģ¯åĪĥãģł"
1743
+ ],
1744
+ [
1745
+ "ãĤĴè£Ĥ",
1746
+ "ãģij"
1747
+ ],
1748
+ [
1749
+ "ãģ®è²¬å",
1750
+ "ĭĻ"
1751
+ ],
1752
+ [
1753
+ "ãģijãģĺãĤ",
1754
+ "ĥãģªãģĦ"
1755
+ ],
1756
+ [
1757
+ "Ġ決",
1758
+ "ãģĹãģ¦è«¦ãĤģãĤĭãģª"
1759
+ ],
1760
+ [
1761
+ "Ġæĸ¬æ",
1762
+ "ĴĥãĤĴéĩįãģŃãĤį"
1763
+ ],
1764
+ [
1765
+ "ĠæŁ±ãģ",
1766
+ "¨ãģĹãģ¦"
1767
+ ],
1768
+ [
1769
+ "ãģ¯ç¶ļ",
1770
+ "ãģĦãģ¦"
1771
+ ],
1772
+ [
1773
+ "Ġ風",
1774
+ "ãģ®åŀĭ"
1775
+ ],
1776
+ [
1777
+ "Ġ鬼",
1778
+ "ãĤĴè¨İãģ¤ãģ®ãģ¯åĪĥãģł"
1779
+ ],
1780
+ [
1781
+ "ĠéĹĩãĤĴé",
1782
+ "§ĨãģijãĤį"
1783
+ ],
1784
+ [
1785
+ "ãģłãģĭãĤī",
1786
+ "ãģĵãģĿå¼·ãģ"
1787
+ ],
1788
+ [
1789
+ "åIJijãģijãĤĭ",
1790
+ "ãģĵãģ¨ãģ¯"
1791
+ ],
1792
+ [
1793
+ "æĬĢãĤĴç",
1794
+ "£¨ãģij"
1795
+ ],
1796
+ [
1797
+ "Ġ稲",
1798
+ "妻ãģ®ãģĶãģ¨ãģ"
1799
+ ],
1800
+ [
1801
+ "ĠçĤİ",
1802
+ "ãģ®åŀĭ"
1803
+ ],
1804
+ [
1805
+ "ãĤĤãģ¾ãģ",
1806
+ "ŁåĪĥãģł"
1807
+ ],
1808
+ [
1809
+ "ãĤĴæĸŃ",
1810
+ "ãģ¡åĪĩãĤĮ"
1811
+ ],
1812
+ [
1813
+ "ä»Ĭãģ",
1814
+ "ĵãģ®çŀ¬éĸĵãģ«åij"
1815
+ ],
1816
+ [
1817
+ "ä½ķ度ãģ",
1818
+ "§ãĤĤç«ĭ"
1819
+ ],
1820
+ [
1821
+ "åij¼åIJ¸",
1822
+ "ãģ¯ç¶ļãģĦãģ¦"
1823
+ ],
1824
+ [
1825
+ "許ãģķ",
1826
+ "ãĤĮãģªãģĦ"
1827
+ ],
1828
+ [
1829
+ "Ġå¼±ãģķ",
1830
+ "ãĤĴçŁ¥ãĤĮ"
1831
+ ],
1832
+ [
1833
+ "æĬĺãĤĮãĤĭãģ®ãģ¯",
1834
+ "è¦ļæĤŁãģ®"
1835
+ ],
1836
+ [
1837
+ "æģIJãĤĮ",
1838
+ "ãĤĴæĸŃãģ¡åĪĩãĤĮ"
1839
+ ],
1840
+ [
1841
+ "æĦıå¿Ĺ",
1842
+ "ãĤĤãģ¾ãģŁåĪĥãģł"
1843
+ ],
1844
+ [
1845
+ "èĥĮãĤĴ",
1846
+ "åIJijãģijãĤĭãģĵãģ¨ãģ¯"
1847
+ ],
1848
+ [
1849
+ "Ġ仲éĸĵãĤĴ",
1850
+ "å®ĪãĤĭ"
1851
+ ],
1852
+ [
1853
+ "Ġãģ¿ãģªãĤĤ",
1854
+ "ãĤĴè£Ĥãģij"
1855
+ ],
1856
+ [
1857
+ "ãģĿãģ®ãģŁãĤģãģªãĤī",
1858
+ "ä½ķ度ãģ§ãĤĤç«ĭ"
1859
+ ],
1860
+ [
1861
+ "ĠåĨĨãĤĴæıı",
1862
+ "ãģij"
1863
+ ],
1864
+ [
1865
+ "Ġåij¼åIJ¸ãĤĴçłĶãģİæ¾Ħãģ",
1866
+ "¾ãģĽ"
1867
+ ],
1868
+ [
1869
+ "ĠæŁ±ãģ¨ãģĹãģ¦",
1870
+ "ãģ®è²¬åĭĻ"
1871
+ ],
1872
+ [
1873
+ "Ġ鬼ãĤĴè¨İãģ¤ãģ®ãģ¯åĪĥãģł",
1874
+ "ãģijãģĺãĤĥãģªãģĦ"
1875
+ ],
1876
+ [
1877
+ "ãģłãģĭãĤīãģĵãģĿå¼·ãģ",
1878
+ "ķãģĮ宿ãĤĭ"
1879
+ ],
1880
+ [
1881
+ "Ġ稲妻ãģ®ãģĶãģ¨ãģ",
1882
+ "ıè¸ıãģ¿è¾¼ãĤģ"
1883
+ ],
1884
+ [
1885
+ "ä»Ĭãģĵãģ®çŀ¬éĸĵãģ«åij",
1886
+ "½ãĤĴæĩ¸ãģijãĤĭ"
1887
+ ],
1888
+ [
1889
+ "åij¼åIJ¸ãģ¯ç¶ļãģĦãģ¦",
1890
+ "ãģĦãĤĭ"
1891
+ ],
1892
+ [
1893
+ "æĬĺãĤĮãĤĭãģ®ãģ¯è¦ļæĤŁãģ®",
1894
+ "æĸ¹ãģł"
1895
+ ],
1896
+ [
1897
+ "èĥĮãĤĴåIJijãģijãĤĭãģĵãģ¨ãģ¯",
1898
+ "許ãģķãĤĮãģªãģĦ"
1899
+ ],
1900
+ [
1901
+ "ãģĿãģ®ãģŁãĤģãģªãĤīä½ķ度ãģ§ãĤĤç«ĭ",
1902
+ "ãģ¤"
1903
+ ]
1904
+ ]
1905
+ }
1906
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "<s>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "<pad>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2": {
20
+ "content": "</s>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "3": {
28
+ "content": "<unk>",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ }
35
+ },
36
+ "bos_token": "<s>",
37
+ "clean_up_tokenization_spaces": false,
38
+ "eos_token": "</s>",
39
+ "extra_special_tokens": {},
40
+ "model_max_length": 1000000000000000019884624838656,
41
+ "pad_token": "<pad>",
42
+ "tokenizer_class": "PreTrainedTokenizerFast",
43
+ "unk_token": "<unk>"
44
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b761e97981f33bde7c70dfe5c9b438eac49034f1648cbdce0a9a315b71b86e5
3
+ size 5777