Ba2han commited on
Commit
6e21fd9
·
1 Parent(s): 0ee5d75

Training in progress, step 315, checkpoint

Browse files
last-checkpoint/config.json CHANGED
@@ -10,69 +10,61 @@
10
  "bos_token_id": 50030,
11
  "dtype": "bfloat16",
12
  "eos_token_id": 50031,
13
- "head_dim": 64,
14
  "hidden_act": "silu",
15
  "hidden_size": 1152,
16
  "initializer_range": 0.02,
17
- "intermediate_size": 2880,
18
  "layer_types": [
19
  "full_attention",
 
20
  "full_attention",
 
21
  "full_attention",
 
22
  "full_attention",
 
23
  "full_attention",
 
24
  "full_attention",
 
25
  "full_attention",
 
26
  "full_attention",
 
27
  "full_attention",
 
28
  "full_attention",
 
29
  "full_attention",
 
30
  "full_attention",
 
31
  "full_attention",
 
32
  "full_attention",
 
33
  "full_attention",
 
34
  "full_attention",
 
35
  "full_attention",
 
36
  "full_attention",
 
37
  "full_attention",
 
38
  "full_attention",
39
- "full_attention",
40
- "full_attention",
41
- "full_attention",
42
- "full_attention",
43
- "full_attention",
44
- "full_attention",
45
- "full_attention",
46
- "full_attention",
47
- "full_attention",
48
- "full_attention",
49
- "full_attention",
50
- "full_attention",
51
- "full_attention",
52
- "full_attention",
53
- "full_attention",
54
- "full_attention",
55
- "full_attention",
56
- "full_attention",
57
- "full_attention",
58
- "full_attention",
59
- "full_attention",
60
- "full_attention",
61
- "full_attention",
62
- "full_attention",
63
- "full_attention",
64
- "full_attention",
65
- "full_attention",
66
- "full_attention"
67
  ],
68
  "max_position_embeddings": 8192,
69
- "max_window_layers": 48,
70
  "mlp_type": "squared_relu",
71
- "model_name": "test_checkpoint",
72
  "model_type": "qwen3",
73
- "n_layer": 48,
74
  "num_attention_heads": 16,
75
- "num_hidden_layers": 48,
76
  "num_key_value_heads": 4,
77
  "pad_token_id": 50034,
78
  "rms_norm_eps": 1e-06,
@@ -80,13 +72,13 @@
80
  "rope_theta": 50000,
81
  "rope_type": "default"
82
  },
83
- "sliding_window": null,
84
  "squared_relu_activation": "relu2",
85
- "squared_relu_intermediate_size": 2880,
86
- "tie_word_embeddings": false,
87
- "transformers_version": "5.7.0",
88
- "unsloth_version": "2026.4.8",
89
  "use_cache": false,
90
- "use_sliding_window": false,
91
- "vocab_size": 50048
92
  }
 
10
  "bos_token_id": 50030,
11
  "dtype": "bfloat16",
12
  "eos_token_id": 50031,
13
+ "head_dim": 128,
14
  "hidden_act": "silu",
15
  "hidden_size": 1152,
16
  "initializer_range": 0.02,
17
+ "intermediate_size": 3168,
18
  "layer_types": [
19
  "full_attention",
20
+ "sliding_attention",
21
  "full_attention",
22
+ "sliding_attention",
23
  "full_attention",
24
+ "sliding_attention",
25
  "full_attention",
26
+ "sliding_attention",
27
  "full_attention",
28
+ "sliding_attention",
29
  "full_attention",
30
+ "sliding_attention",
31
  "full_attention",
32
+ "sliding_attention",
33
  "full_attention",
34
+ "sliding_attention",
35
  "full_attention",
36
+ "sliding_attention",
37
  "full_attention",
38
+ "sliding_attention",
39
  "full_attention",
40
+ "sliding_attention",
41
  "full_attention",
42
+ "sliding_attention",
43
  "full_attention",
44
+ "sliding_attention",
45
  "full_attention",
46
+ "sliding_attention",
47
  "full_attention",
48
+ "sliding_attention",
49
  "full_attention",
50
+ "sliding_attention",
51
  "full_attention",
52
+ "sliding_attention",
53
  "full_attention",
54
+ "sliding_attention",
55
  "full_attention",
56
+ "sliding_attention",
57
  "full_attention",
58
+ "sliding_attention"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
59
  ],
60
  "max_position_embeddings": 8192,
61
+ "max_window_layers": 40,
62
  "mlp_type": "squared_relu",
63
+ "model_name": "qwen3-canon-padded",
64
  "model_type": "qwen3",
65
+ "n_layer": 40,
66
  "num_attention_heads": 16,
67
+ "num_hidden_layers": 40,
68
  "num_key_value_heads": 4,
69
  "pad_token_id": 50034,
70
  "rms_norm_eps": 1e-06,
 
72
  "rope_theta": 50000,
73
  "rope_type": "default"
74
  },
75
+ "sliding_window": 4096,
76
  "squared_relu_activation": "relu2",
77
+ "squared_relu_intermediate_size": 3168,
78
+ "tie_word_embeddings": true,
79
+ "transformers_version": "5.5.0",
80
+ "unsloth_version": "2026.5.2",
81
  "use_cache": false,
82
+ "use_sliding_window": true,
83
+ "vocab_size": 50304
84
  }
last-checkpoint/generation_config.json CHANGED
@@ -8,6 +8,6 @@
8
  "output_attentions": false,
9
  "output_hidden_states": false,
10
  "pad_token_id": 50034,
11
- "transformers_version": "5.7.0",
12
  "use_cache": false
13
  }
 
8
  "output_attentions": false,
9
  "output_hidden_states": false,
10
  "pad_token_id": 50034,
11
+ "transformers_version": "5.5.0",
12
  "use_cache": false
13
  }
last-checkpoint/tokenizer.json CHANGED
@@ -164,6 +164,2310 @@
164
  "rstrip": false,
165
  "normalized": false,
166
  "special": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
167
  }
168
  ],
169
  "normalizer": null,
 
164
  "rstrip": false,
165
  "normalized": false,
166
  "special": true
167
+ },
168
+ {
169
+ "id": 50048,
170
+ "content": "<|pad_token[0]|>",
171
+ "single_word": false,
172
+ "lstrip": false,
173
+ "rstrip": false,
174
+ "normalized": false,
175
+ "special": true
176
+ },
177
+ {
178
+ "id": 50049,
179
+ "content": "<|pad_token[1]|>",
180
+ "single_word": false,
181
+ "lstrip": false,
182
+ "rstrip": false,
183
+ "normalized": false,
184
+ "special": true
185
+ },
186
+ {
187
+ "id": 50050,
188
+ "content": "<|pad_token[2]|>",
189
+ "single_word": false,
190
+ "lstrip": false,
191
+ "rstrip": false,
192
+ "normalized": false,
193
+ "special": true
194
+ },
195
+ {
196
+ "id": 50051,
197
+ "content": "<|pad_token[3]|>",
198
+ "single_word": false,
199
+ "lstrip": false,
200
+ "rstrip": false,
201
+ "normalized": false,
202
+ "special": true
203
+ },
204
+ {
205
+ "id": 50052,
206
+ "content": "<|pad_token[4]|>",
207
+ "single_word": false,
208
+ "lstrip": false,
209
+ "rstrip": false,
210
+ "normalized": false,
211
+ "special": true
212
+ },
213
+ {
214
+ "id": 50053,
215
+ "content": "<|pad_token[5]|>",
216
+ "single_word": false,
217
+ "lstrip": false,
218
+ "rstrip": false,
219
+ "normalized": false,
220
+ "special": true
221
+ },
222
+ {
223
+ "id": 50054,
224
+ "content": "<|pad_token[6]|>",
225
+ "single_word": false,
226
+ "lstrip": false,
227
+ "rstrip": false,
228
+ "normalized": false,
229
+ "special": true
230
+ },
231
+ {
232
+ "id": 50055,
233
+ "content": "<|pad_token[7]|>",
234
+ "single_word": false,
235
+ "lstrip": false,
236
+ "rstrip": false,
237
+ "normalized": false,
238
+ "special": true
239
+ },
240
+ {
241
+ "id": 50056,
242
+ "content": "<|pad_token[8]|>",
243
+ "single_word": false,
244
+ "lstrip": false,
245
+ "rstrip": false,
246
+ "normalized": false,
247
+ "special": true
248
+ },
249
+ {
250
+ "id": 50057,
251
+ "content": "<|pad_token[9]|>",
252
+ "single_word": false,
253
+ "lstrip": false,
254
+ "rstrip": false,
255
+ "normalized": false,
256
+ "special": true
257
+ },
258
+ {
259
+ "id": 50058,
260
+ "content": "<|pad_token[10]|>",
261
+ "single_word": false,
262
+ "lstrip": false,
263
+ "rstrip": false,
264
+ "normalized": false,
265
+ "special": true
266
+ },
267
+ {
268
+ "id": 50059,
269
+ "content": "<|pad_token[11]|>",
270
+ "single_word": false,
271
+ "lstrip": false,
272
+ "rstrip": false,
273
+ "normalized": false,
274
+ "special": true
275
+ },
276
+ {
277
+ "id": 50060,
278
+ "content": "<|pad_token[12]|>",
279
+ "single_word": false,
280
+ "lstrip": false,
281
+ "rstrip": false,
282
+ "normalized": false,
283
+ "special": true
284
+ },
285
+ {
286
+ "id": 50061,
287
+ "content": "<|pad_token[13]|>",
288
+ "single_word": false,
289
+ "lstrip": false,
290
+ "rstrip": false,
291
+ "normalized": false,
292
+ "special": true
293
+ },
294
+ {
295
+ "id": 50062,
296
+ "content": "<|pad_token[14]|>",
297
+ "single_word": false,
298
+ "lstrip": false,
299
+ "rstrip": false,
300
+ "normalized": false,
301
+ "special": true
302
+ },
303
+ {
304
+ "id": 50063,
305
+ "content": "<|pad_token[15]|>",
306
+ "single_word": false,
307
+ "lstrip": false,
308
+ "rstrip": false,
309
+ "normalized": false,
310
+ "special": true
311
+ },
312
+ {
313
+ "id": 50064,
314
+ "content": "<|pad_token[16]|>",
315
+ "single_word": false,
316
+ "lstrip": false,
317
+ "rstrip": false,
318
+ "normalized": false,
319
+ "special": true
320
+ },
321
+ {
322
+ "id": 50065,
323
+ "content": "<|pad_token[17]|>",
324
+ "single_word": false,
325
+ "lstrip": false,
326
+ "rstrip": false,
327
+ "normalized": false,
328
+ "special": true
329
+ },
330
+ {
331
+ "id": 50066,
332
+ "content": "<|pad_token[18]|>",
333
+ "single_word": false,
334
+ "lstrip": false,
335
+ "rstrip": false,
336
+ "normalized": false,
337
+ "special": true
338
+ },
339
+ {
340
+ "id": 50067,
341
+ "content": "<|pad_token[19]|>",
342
+ "single_word": false,
343
+ "lstrip": false,
344
+ "rstrip": false,
345
+ "normalized": false,
346
+ "special": true
347
+ },
348
+ {
349
+ "id": 50068,
350
+ "content": "<|pad_token[20]|>",
351
+ "single_word": false,
352
+ "lstrip": false,
353
+ "rstrip": false,
354
+ "normalized": false,
355
+ "special": true
356
+ },
357
+ {
358
+ "id": 50069,
359
+ "content": "<|pad_token[21]|>",
360
+ "single_word": false,
361
+ "lstrip": false,
362
+ "rstrip": false,
363
+ "normalized": false,
364
+ "special": true
365
+ },
366
+ {
367
+ "id": 50070,
368
+ "content": "<|pad_token[22]|>",
369
+ "single_word": false,
370
+ "lstrip": false,
371
+ "rstrip": false,
372
+ "normalized": false,
373
+ "special": true
374
+ },
375
+ {
376
+ "id": 50071,
377
+ "content": "<|pad_token[23]|>",
378
+ "single_word": false,
379
+ "lstrip": false,
380
+ "rstrip": false,
381
+ "normalized": false,
382
+ "special": true
383
+ },
384
+ {
385
+ "id": 50072,
386
+ "content": "<|pad_token[24]|>",
387
+ "single_word": false,
388
+ "lstrip": false,
389
+ "rstrip": false,
390
+ "normalized": false,
391
+ "special": true
392
+ },
393
+ {
394
+ "id": 50073,
395
+ "content": "<|pad_token[25]|>",
396
+ "single_word": false,
397
+ "lstrip": false,
398
+ "rstrip": false,
399
+ "normalized": false,
400
+ "special": true
401
+ },
402
+ {
403
+ "id": 50074,
404
+ "content": "<|pad_token[26]|>",
405
+ "single_word": false,
406
+ "lstrip": false,
407
+ "rstrip": false,
408
+ "normalized": false,
409
+ "special": true
410
+ },
411
+ {
412
+ "id": 50075,
413
+ "content": "<|pad_token[27]|>",
414
+ "single_word": false,
415
+ "lstrip": false,
416
+ "rstrip": false,
417
+ "normalized": false,
418
+ "special": true
419
+ },
420
+ {
421
+ "id": 50076,
422
+ "content": "<|pad_token[28]|>",
423
+ "single_word": false,
424
+ "lstrip": false,
425
+ "rstrip": false,
426
+ "normalized": false,
427
+ "special": true
428
+ },
429
+ {
430
+ "id": 50077,
431
+ "content": "<|pad_token[29]|>",
432
+ "single_word": false,
433
+ "lstrip": false,
434
+ "rstrip": false,
435
+ "normalized": false,
436
+ "special": true
437
+ },
438
+ {
439
+ "id": 50078,
440
+ "content": "<|pad_token[30]|>",
441
+ "single_word": false,
442
+ "lstrip": false,
443
+ "rstrip": false,
444
+ "normalized": false,
445
+ "special": true
446
+ },
447
+ {
448
+ "id": 50079,
449
+ "content": "<|pad_token[31]|>",
450
+ "single_word": false,
451
+ "lstrip": false,
452
+ "rstrip": false,
453
+ "normalized": false,
454
+ "special": true
455
+ },
456
+ {
457
+ "id": 50080,
458
+ "content": "<|pad_token[32]|>",
459
+ "single_word": false,
460
+ "lstrip": false,
461
+ "rstrip": false,
462
+ "normalized": false,
463
+ "special": true
464
+ },
465
+ {
466
+ "id": 50081,
467
+ "content": "<|pad_token[33]|>",
468
+ "single_word": false,
469
+ "lstrip": false,
470
+ "rstrip": false,
471
+ "normalized": false,
472
+ "special": true
473
+ },
474
+ {
475
+ "id": 50082,
476
+ "content": "<|pad_token[34]|>",
477
+ "single_word": false,
478
+ "lstrip": false,
479
+ "rstrip": false,
480
+ "normalized": false,
481
+ "special": true
482
+ },
483
+ {
484
+ "id": 50083,
485
+ "content": "<|pad_token[35]|>",
486
+ "single_word": false,
487
+ "lstrip": false,
488
+ "rstrip": false,
489
+ "normalized": false,
490
+ "special": true
491
+ },
492
+ {
493
+ "id": 50084,
494
+ "content": "<|pad_token[36]|>",
495
+ "single_word": false,
496
+ "lstrip": false,
497
+ "rstrip": false,
498
+ "normalized": false,
499
+ "special": true
500
+ },
501
+ {
502
+ "id": 50085,
503
+ "content": "<|pad_token[37]|>",
504
+ "single_word": false,
505
+ "lstrip": false,
506
+ "rstrip": false,
507
+ "normalized": false,
508
+ "special": true
509
+ },
510
+ {
511
+ "id": 50086,
512
+ "content": "<|pad_token[38]|>",
513
+ "single_word": false,
514
+ "lstrip": false,
515
+ "rstrip": false,
516
+ "normalized": false,
517
+ "special": true
518
+ },
519
+ {
520
+ "id": 50087,
521
+ "content": "<|pad_token[39]|>",
522
+ "single_word": false,
523
+ "lstrip": false,
524
+ "rstrip": false,
525
+ "normalized": false,
526
+ "special": true
527
+ },
528
+ {
529
+ "id": 50088,
530
+ "content": "<|pad_token[40]|>",
531
+ "single_word": false,
532
+ "lstrip": false,
533
+ "rstrip": false,
534
+ "normalized": false,
535
+ "special": true
536
+ },
537
+ {
538
+ "id": 50089,
539
+ "content": "<|pad_token[41]|>",
540
+ "single_word": false,
541
+ "lstrip": false,
542
+ "rstrip": false,
543
+ "normalized": false,
544
+ "special": true
545
+ },
546
+ {
547
+ "id": 50090,
548
+ "content": "<|pad_token[42]|>",
549
+ "single_word": false,
550
+ "lstrip": false,
551
+ "rstrip": false,
552
+ "normalized": false,
553
+ "special": true
554
+ },
555
+ {
556
+ "id": 50091,
557
+ "content": "<|pad_token[43]|>",
558
+ "single_word": false,
559
+ "lstrip": false,
560
+ "rstrip": false,
561
+ "normalized": false,
562
+ "special": true
563
+ },
564
+ {
565
+ "id": 50092,
566
+ "content": "<|pad_token[44]|>",
567
+ "single_word": false,
568
+ "lstrip": false,
569
+ "rstrip": false,
570
+ "normalized": false,
571
+ "special": true
572
+ },
573
+ {
574
+ "id": 50093,
575
+ "content": "<|pad_token[45]|>",
576
+ "single_word": false,
577
+ "lstrip": false,
578
+ "rstrip": false,
579
+ "normalized": false,
580
+ "special": true
581
+ },
582
+ {
583
+ "id": 50094,
584
+ "content": "<|pad_token[46]|>",
585
+ "single_word": false,
586
+ "lstrip": false,
587
+ "rstrip": false,
588
+ "normalized": false,
589
+ "special": true
590
+ },
591
+ {
592
+ "id": 50095,
593
+ "content": "<|pad_token[47]|>",
594
+ "single_word": false,
595
+ "lstrip": false,
596
+ "rstrip": false,
597
+ "normalized": false,
598
+ "special": true
599
+ },
600
+ {
601
+ "id": 50096,
602
+ "content": "<|pad_token[48]|>",
603
+ "single_word": false,
604
+ "lstrip": false,
605
+ "rstrip": false,
606
+ "normalized": false,
607
+ "special": true
608
+ },
609
+ {
610
+ "id": 50097,
611
+ "content": "<|pad_token[49]|>",
612
+ "single_word": false,
613
+ "lstrip": false,
614
+ "rstrip": false,
615
+ "normalized": false,
616
+ "special": true
617
+ },
618
+ {
619
+ "id": 50098,
620
+ "content": "<|pad_token[50]|>",
621
+ "single_word": false,
622
+ "lstrip": false,
623
+ "rstrip": false,
624
+ "normalized": false,
625
+ "special": true
626
+ },
627
+ {
628
+ "id": 50099,
629
+ "content": "<|pad_token[51]|>",
630
+ "single_word": false,
631
+ "lstrip": false,
632
+ "rstrip": false,
633
+ "normalized": false,
634
+ "special": true
635
+ },
636
+ {
637
+ "id": 50100,
638
+ "content": "<|pad_token[52]|>",
639
+ "single_word": false,
640
+ "lstrip": false,
641
+ "rstrip": false,
642
+ "normalized": false,
643
+ "special": true
644
+ },
645
+ {
646
+ "id": 50101,
647
+ "content": "<|pad_token[53]|>",
648
+ "single_word": false,
649
+ "lstrip": false,
650
+ "rstrip": false,
651
+ "normalized": false,
652
+ "special": true
653
+ },
654
+ {
655
+ "id": 50102,
656
+ "content": "<|pad_token[54]|>",
657
+ "single_word": false,
658
+ "lstrip": false,
659
+ "rstrip": false,
660
+ "normalized": false,
661
+ "special": true
662
+ },
663
+ {
664
+ "id": 50103,
665
+ "content": "<|pad_token[55]|>",
666
+ "single_word": false,
667
+ "lstrip": false,
668
+ "rstrip": false,
669
+ "normalized": false,
670
+ "special": true
671
+ },
672
+ {
673
+ "id": 50104,
674
+ "content": "<|pad_token[56]|>",
675
+ "single_word": false,
676
+ "lstrip": false,
677
+ "rstrip": false,
678
+ "normalized": false,
679
+ "special": true
680
+ },
681
+ {
682
+ "id": 50105,
683
+ "content": "<|pad_token[57]|>",
684
+ "single_word": false,
685
+ "lstrip": false,
686
+ "rstrip": false,
687
+ "normalized": false,
688
+ "special": true
689
+ },
690
+ {
691
+ "id": 50106,
692
+ "content": "<|pad_token[58]|>",
693
+ "single_word": false,
694
+ "lstrip": false,
695
+ "rstrip": false,
696
+ "normalized": false,
697
+ "special": true
698
+ },
699
+ {
700
+ "id": 50107,
701
+ "content": "<|pad_token[59]|>",
702
+ "single_word": false,
703
+ "lstrip": false,
704
+ "rstrip": false,
705
+ "normalized": false,
706
+ "special": true
707
+ },
708
+ {
709
+ "id": 50108,
710
+ "content": "<|pad_token[60]|>",
711
+ "single_word": false,
712
+ "lstrip": false,
713
+ "rstrip": false,
714
+ "normalized": false,
715
+ "special": true
716
+ },
717
+ {
718
+ "id": 50109,
719
+ "content": "<|pad_token[61]|>",
720
+ "single_word": false,
721
+ "lstrip": false,
722
+ "rstrip": false,
723
+ "normalized": false,
724
+ "special": true
725
+ },
726
+ {
727
+ "id": 50110,
728
+ "content": "<|pad_token[62]|>",
729
+ "single_word": false,
730
+ "lstrip": false,
731
+ "rstrip": false,
732
+ "normalized": false,
733
+ "special": true
734
+ },
735
+ {
736
+ "id": 50111,
737
+ "content": "<|pad_token[63]|>",
738
+ "single_word": false,
739
+ "lstrip": false,
740
+ "rstrip": false,
741
+ "normalized": false,
742
+ "special": true
743
+ },
744
+ {
745
+ "id": 50112,
746
+ "content": "<|pad_token[64]|>",
747
+ "single_word": false,
748
+ "lstrip": false,
749
+ "rstrip": false,
750
+ "normalized": false,
751
+ "special": true
752
+ },
753
+ {
754
+ "id": 50113,
755
+ "content": "<|pad_token[65]|>",
756
+ "single_word": false,
757
+ "lstrip": false,
758
+ "rstrip": false,
759
+ "normalized": false,
760
+ "special": true
761
+ },
762
+ {
763
+ "id": 50114,
764
+ "content": "<|pad_token[66]|>",
765
+ "single_word": false,
766
+ "lstrip": false,
767
+ "rstrip": false,
768
+ "normalized": false,
769
+ "special": true
770
+ },
771
+ {
772
+ "id": 50115,
773
+ "content": "<|pad_token[67]|>",
774
+ "single_word": false,
775
+ "lstrip": false,
776
+ "rstrip": false,
777
+ "normalized": false,
778
+ "special": true
779
+ },
780
+ {
781
+ "id": 50116,
782
+ "content": "<|pad_token[68]|>",
783
+ "single_word": false,
784
+ "lstrip": false,
785
+ "rstrip": false,
786
+ "normalized": false,
787
+ "special": true
788
+ },
789
+ {
790
+ "id": 50117,
791
+ "content": "<|pad_token[69]|>",
792
+ "single_word": false,
793
+ "lstrip": false,
794
+ "rstrip": false,
795
+ "normalized": false,
796
+ "special": true
797
+ },
798
+ {
799
+ "id": 50118,
800
+ "content": "<|pad_token[70]|>",
801
+ "single_word": false,
802
+ "lstrip": false,
803
+ "rstrip": false,
804
+ "normalized": false,
805
+ "special": true
806
+ },
807
+ {
808
+ "id": 50119,
809
+ "content": "<|pad_token[71]|>",
810
+ "single_word": false,
811
+ "lstrip": false,
812
+ "rstrip": false,
813
+ "normalized": false,
814
+ "special": true
815
+ },
816
+ {
817
+ "id": 50120,
818
+ "content": "<|pad_token[72]|>",
819
+ "single_word": false,
820
+ "lstrip": false,
821
+ "rstrip": false,
822
+ "normalized": false,
823
+ "special": true
824
+ },
825
+ {
826
+ "id": 50121,
827
+ "content": "<|pad_token[73]|>",
828
+ "single_word": false,
829
+ "lstrip": false,
830
+ "rstrip": false,
831
+ "normalized": false,
832
+ "special": true
833
+ },
834
+ {
835
+ "id": 50122,
836
+ "content": "<|pad_token[74]|>",
837
+ "single_word": false,
838
+ "lstrip": false,
839
+ "rstrip": false,
840
+ "normalized": false,
841
+ "special": true
842
+ },
843
+ {
844
+ "id": 50123,
845
+ "content": "<|pad_token[75]|>",
846
+ "single_word": false,
847
+ "lstrip": false,
848
+ "rstrip": false,
849
+ "normalized": false,
850
+ "special": true
851
+ },
852
+ {
853
+ "id": 50124,
854
+ "content": "<|pad_token[76]|>",
855
+ "single_word": false,
856
+ "lstrip": false,
857
+ "rstrip": false,
858
+ "normalized": false,
859
+ "special": true
860
+ },
861
+ {
862
+ "id": 50125,
863
+ "content": "<|pad_token[77]|>",
864
+ "single_word": false,
865
+ "lstrip": false,
866
+ "rstrip": false,
867
+ "normalized": false,
868
+ "special": true
869
+ },
870
+ {
871
+ "id": 50126,
872
+ "content": "<|pad_token[78]|>",
873
+ "single_word": false,
874
+ "lstrip": false,
875
+ "rstrip": false,
876
+ "normalized": false,
877
+ "special": true
878
+ },
879
+ {
880
+ "id": 50127,
881
+ "content": "<|pad_token[79]|>",
882
+ "single_word": false,
883
+ "lstrip": false,
884
+ "rstrip": false,
885
+ "normalized": false,
886
+ "special": true
887
+ },
888
+ {
889
+ "id": 50128,
890
+ "content": "<|pad_token[80]|>",
891
+ "single_word": false,
892
+ "lstrip": false,
893
+ "rstrip": false,
894
+ "normalized": false,
895
+ "special": true
896
+ },
897
+ {
898
+ "id": 50129,
899
+ "content": "<|pad_token[81]|>",
900
+ "single_word": false,
901
+ "lstrip": false,
902
+ "rstrip": false,
903
+ "normalized": false,
904
+ "special": true
905
+ },
906
+ {
907
+ "id": 50130,
908
+ "content": "<|pad_token[82]|>",
909
+ "single_word": false,
910
+ "lstrip": false,
911
+ "rstrip": false,
912
+ "normalized": false,
913
+ "special": true
914
+ },
915
+ {
916
+ "id": 50131,
917
+ "content": "<|pad_token[83]|>",
918
+ "single_word": false,
919
+ "lstrip": false,
920
+ "rstrip": false,
921
+ "normalized": false,
922
+ "special": true
923
+ },
924
+ {
925
+ "id": 50132,
926
+ "content": "<|pad_token[84]|>",
927
+ "single_word": false,
928
+ "lstrip": false,
929
+ "rstrip": false,
930
+ "normalized": false,
931
+ "special": true
932
+ },
933
+ {
934
+ "id": 50133,
935
+ "content": "<|pad_token[85]|>",
936
+ "single_word": false,
937
+ "lstrip": false,
938
+ "rstrip": false,
939
+ "normalized": false,
940
+ "special": true
941
+ },
942
+ {
943
+ "id": 50134,
944
+ "content": "<|pad_token[86]|>",
945
+ "single_word": false,
946
+ "lstrip": false,
947
+ "rstrip": false,
948
+ "normalized": false,
949
+ "special": true
950
+ },
951
+ {
952
+ "id": 50135,
953
+ "content": "<|pad_token[87]|>",
954
+ "single_word": false,
955
+ "lstrip": false,
956
+ "rstrip": false,
957
+ "normalized": false,
958
+ "special": true
959
+ },
960
+ {
961
+ "id": 50136,
962
+ "content": "<|pad_token[88]|>",
963
+ "single_word": false,
964
+ "lstrip": false,
965
+ "rstrip": false,
966
+ "normalized": false,
967
+ "special": true
968
+ },
969
+ {
970
+ "id": 50137,
971
+ "content": "<|pad_token[89]|>",
972
+ "single_word": false,
973
+ "lstrip": false,
974
+ "rstrip": false,
975
+ "normalized": false,
976
+ "special": true
977
+ },
978
+ {
979
+ "id": 50138,
980
+ "content": "<|pad_token[90]|>",
981
+ "single_word": false,
982
+ "lstrip": false,
983
+ "rstrip": false,
984
+ "normalized": false,
985
+ "special": true
986
+ },
987
+ {
988
+ "id": 50139,
989
+ "content": "<|pad_token[91]|>",
990
+ "single_word": false,
991
+ "lstrip": false,
992
+ "rstrip": false,
993
+ "normalized": false,
994
+ "special": true
995
+ },
996
+ {
997
+ "id": 50140,
998
+ "content": "<|pad_token[92]|>",
999
+ "single_word": false,
1000
+ "lstrip": false,
1001
+ "rstrip": false,
1002
+ "normalized": false,
1003
+ "special": true
1004
+ },
1005
+ {
1006
+ "id": 50141,
1007
+ "content": "<|pad_token[93]|>",
1008
+ "single_word": false,
1009
+ "lstrip": false,
1010
+ "rstrip": false,
1011
+ "normalized": false,
1012
+ "special": true
1013
+ },
1014
+ {
1015
+ "id": 50142,
1016
+ "content": "<|pad_token[94]|>",
1017
+ "single_word": false,
1018
+ "lstrip": false,
1019
+ "rstrip": false,
1020
+ "normalized": false,
1021
+ "special": true
1022
+ },
1023
+ {
1024
+ "id": 50143,
1025
+ "content": "<|pad_token[95]|>",
1026
+ "single_word": false,
1027
+ "lstrip": false,
1028
+ "rstrip": false,
1029
+ "normalized": false,
1030
+ "special": true
1031
+ },
1032
+ {
1033
+ "id": 50144,
1034
+ "content": "<|pad_token[96]|>",
1035
+ "single_word": false,
1036
+ "lstrip": false,
1037
+ "rstrip": false,
1038
+ "normalized": false,
1039
+ "special": true
1040
+ },
1041
+ {
1042
+ "id": 50145,
1043
+ "content": "<|pad_token[97]|>",
1044
+ "single_word": false,
1045
+ "lstrip": false,
1046
+ "rstrip": false,
1047
+ "normalized": false,
1048
+ "special": true
1049
+ },
1050
+ {
1051
+ "id": 50146,
1052
+ "content": "<|pad_token[98]|>",
1053
+ "single_word": false,
1054
+ "lstrip": false,
1055
+ "rstrip": false,
1056
+ "normalized": false,
1057
+ "special": true
1058
+ },
1059
+ {
1060
+ "id": 50147,
1061
+ "content": "<|pad_token[99]|>",
1062
+ "single_word": false,
1063
+ "lstrip": false,
1064
+ "rstrip": false,
1065
+ "normalized": false,
1066
+ "special": true
1067
+ },
1068
+ {
1069
+ "id": 50148,
1070
+ "content": "<|pad_token[100]|>",
1071
+ "single_word": false,
1072
+ "lstrip": false,
1073
+ "rstrip": false,
1074
+ "normalized": false,
1075
+ "special": true
1076
+ },
1077
+ {
1078
+ "id": 50149,
1079
+ "content": "<|pad_token[101]|>",
1080
+ "single_word": false,
1081
+ "lstrip": false,
1082
+ "rstrip": false,
1083
+ "normalized": false,
1084
+ "special": true
1085
+ },
1086
+ {
1087
+ "id": 50150,
1088
+ "content": "<|pad_token[102]|>",
1089
+ "single_word": false,
1090
+ "lstrip": false,
1091
+ "rstrip": false,
1092
+ "normalized": false,
1093
+ "special": true
1094
+ },
1095
+ {
1096
+ "id": 50151,
1097
+ "content": "<|pad_token[103]|>",
1098
+ "single_word": false,
1099
+ "lstrip": false,
1100
+ "rstrip": false,
1101
+ "normalized": false,
1102
+ "special": true
1103
+ },
1104
+ {
1105
+ "id": 50152,
1106
+ "content": "<|pad_token[104]|>",
1107
+ "single_word": false,
1108
+ "lstrip": false,
1109
+ "rstrip": false,
1110
+ "normalized": false,
1111
+ "special": true
1112
+ },
1113
+ {
1114
+ "id": 50153,
1115
+ "content": "<|pad_token[105]|>",
1116
+ "single_word": false,
1117
+ "lstrip": false,
1118
+ "rstrip": false,
1119
+ "normalized": false,
1120
+ "special": true
1121
+ },
1122
+ {
1123
+ "id": 50154,
1124
+ "content": "<|pad_token[106]|>",
1125
+ "single_word": false,
1126
+ "lstrip": false,
1127
+ "rstrip": false,
1128
+ "normalized": false,
1129
+ "special": true
1130
+ },
1131
+ {
1132
+ "id": 50155,
1133
+ "content": "<|pad_token[107]|>",
1134
+ "single_word": false,
1135
+ "lstrip": false,
1136
+ "rstrip": false,
1137
+ "normalized": false,
1138
+ "special": true
1139
+ },
1140
+ {
1141
+ "id": 50156,
1142
+ "content": "<|pad_token[108]|>",
1143
+ "single_word": false,
1144
+ "lstrip": false,
1145
+ "rstrip": false,
1146
+ "normalized": false,
1147
+ "special": true
1148
+ },
1149
+ {
1150
+ "id": 50157,
1151
+ "content": "<|pad_token[109]|>",
1152
+ "single_word": false,
1153
+ "lstrip": false,
1154
+ "rstrip": false,
1155
+ "normalized": false,
1156
+ "special": true
1157
+ },
1158
+ {
1159
+ "id": 50158,
1160
+ "content": "<|pad_token[110]|>",
1161
+ "single_word": false,
1162
+ "lstrip": false,
1163
+ "rstrip": false,
1164
+ "normalized": false,
1165
+ "special": true
1166
+ },
1167
+ {
1168
+ "id": 50159,
1169
+ "content": "<|pad_token[111]|>",
1170
+ "single_word": false,
1171
+ "lstrip": false,
1172
+ "rstrip": false,
1173
+ "normalized": false,
1174
+ "special": true
1175
+ },
1176
+ {
1177
+ "id": 50160,
1178
+ "content": "<|pad_token[112]|>",
1179
+ "single_word": false,
1180
+ "lstrip": false,
1181
+ "rstrip": false,
1182
+ "normalized": false,
1183
+ "special": true
1184
+ },
1185
+ {
1186
+ "id": 50161,
1187
+ "content": "<|pad_token[113]|>",
1188
+ "single_word": false,
1189
+ "lstrip": false,
1190
+ "rstrip": false,
1191
+ "normalized": false,
1192
+ "special": true
1193
+ },
1194
+ {
1195
+ "id": 50162,
1196
+ "content": "<|pad_token[114]|>",
1197
+ "single_word": false,
1198
+ "lstrip": false,
1199
+ "rstrip": false,
1200
+ "normalized": false,
1201
+ "special": true
1202
+ },
1203
+ {
1204
+ "id": 50163,
1205
+ "content": "<|pad_token[115]|>",
1206
+ "single_word": false,
1207
+ "lstrip": false,
1208
+ "rstrip": false,
1209
+ "normalized": false,
1210
+ "special": true
1211
+ },
1212
+ {
1213
+ "id": 50164,
1214
+ "content": "<|pad_token[116]|>",
1215
+ "single_word": false,
1216
+ "lstrip": false,
1217
+ "rstrip": false,
1218
+ "normalized": false,
1219
+ "special": true
1220
+ },
1221
+ {
1222
+ "id": 50165,
1223
+ "content": "<|pad_token[117]|>",
1224
+ "single_word": false,
1225
+ "lstrip": false,
1226
+ "rstrip": false,
1227
+ "normalized": false,
1228
+ "special": true
1229
+ },
1230
+ {
1231
+ "id": 50166,
1232
+ "content": "<|pad_token[118]|>",
1233
+ "single_word": false,
1234
+ "lstrip": false,
1235
+ "rstrip": false,
1236
+ "normalized": false,
1237
+ "special": true
1238
+ },
1239
+ {
1240
+ "id": 50167,
1241
+ "content": "<|pad_token[119]|>",
1242
+ "single_word": false,
1243
+ "lstrip": false,
1244
+ "rstrip": false,
1245
+ "normalized": false,
1246
+ "special": true
1247
+ },
1248
+ {
1249
+ "id": 50168,
1250
+ "content": "<|pad_token[120]|>",
1251
+ "single_word": false,
1252
+ "lstrip": false,
1253
+ "rstrip": false,
1254
+ "normalized": false,
1255
+ "special": true
1256
+ },
1257
+ {
1258
+ "id": 50169,
1259
+ "content": "<|pad_token[121]|>",
1260
+ "single_word": false,
1261
+ "lstrip": false,
1262
+ "rstrip": false,
1263
+ "normalized": false,
1264
+ "special": true
1265
+ },
1266
+ {
1267
+ "id": 50170,
1268
+ "content": "<|pad_token[122]|>",
1269
+ "single_word": false,
1270
+ "lstrip": false,
1271
+ "rstrip": false,
1272
+ "normalized": false,
1273
+ "special": true
1274
+ },
1275
+ {
1276
+ "id": 50171,
1277
+ "content": "<|pad_token[123]|>",
1278
+ "single_word": false,
1279
+ "lstrip": false,
1280
+ "rstrip": false,
1281
+ "normalized": false,
1282
+ "special": true
1283
+ },
1284
+ {
1285
+ "id": 50172,
1286
+ "content": "<|pad_token[124]|>",
1287
+ "single_word": false,
1288
+ "lstrip": false,
1289
+ "rstrip": false,
1290
+ "normalized": false,
1291
+ "special": true
1292
+ },
1293
+ {
1294
+ "id": 50173,
1295
+ "content": "<|pad_token[125]|>",
1296
+ "single_word": false,
1297
+ "lstrip": false,
1298
+ "rstrip": false,
1299
+ "normalized": false,
1300
+ "special": true
1301
+ },
1302
+ {
1303
+ "id": 50174,
1304
+ "content": "<|pad_token[126]|>",
1305
+ "single_word": false,
1306
+ "lstrip": false,
1307
+ "rstrip": false,
1308
+ "normalized": false,
1309
+ "special": true
1310
+ },
1311
+ {
1312
+ "id": 50175,
1313
+ "content": "<|pad_token[127]|>",
1314
+ "single_word": false,
1315
+ "lstrip": false,
1316
+ "rstrip": false,
1317
+ "normalized": false,
1318
+ "special": true
1319
+ },
1320
+ {
1321
+ "id": 50176,
1322
+ "content": "<|pad_token[128]|>",
1323
+ "single_word": false,
1324
+ "lstrip": false,
1325
+ "rstrip": false,
1326
+ "normalized": false,
1327
+ "special": true
1328
+ },
1329
+ {
1330
+ "id": 50177,
1331
+ "content": "<|pad_token[129]|>",
1332
+ "single_word": false,
1333
+ "lstrip": false,
1334
+ "rstrip": false,
1335
+ "normalized": false,
1336
+ "special": true
1337
+ },
1338
+ {
1339
+ "id": 50178,
1340
+ "content": "<|pad_token[130]|>",
1341
+ "single_word": false,
1342
+ "lstrip": false,
1343
+ "rstrip": false,
1344
+ "normalized": false,
1345
+ "special": true
1346
+ },
1347
+ {
1348
+ "id": 50179,
1349
+ "content": "<|pad_token[131]|>",
1350
+ "single_word": false,
1351
+ "lstrip": false,
1352
+ "rstrip": false,
1353
+ "normalized": false,
1354
+ "special": true
1355
+ },
1356
+ {
1357
+ "id": 50180,
1358
+ "content": "<|pad_token[132]|>",
1359
+ "single_word": false,
1360
+ "lstrip": false,
1361
+ "rstrip": false,
1362
+ "normalized": false,
1363
+ "special": true
1364
+ },
1365
+ {
1366
+ "id": 50181,
1367
+ "content": "<|pad_token[133]|>",
1368
+ "single_word": false,
1369
+ "lstrip": false,
1370
+ "rstrip": false,
1371
+ "normalized": false,
1372
+ "special": true
1373
+ },
1374
+ {
1375
+ "id": 50182,
1376
+ "content": "<|pad_token[134]|>",
1377
+ "single_word": false,
1378
+ "lstrip": false,
1379
+ "rstrip": false,
1380
+ "normalized": false,
1381
+ "special": true
1382
+ },
1383
+ {
1384
+ "id": 50183,
1385
+ "content": "<|pad_token[135]|>",
1386
+ "single_word": false,
1387
+ "lstrip": false,
1388
+ "rstrip": false,
1389
+ "normalized": false,
1390
+ "special": true
1391
+ },
1392
+ {
1393
+ "id": 50184,
1394
+ "content": "<|pad_token[136]|>",
1395
+ "single_word": false,
1396
+ "lstrip": false,
1397
+ "rstrip": false,
1398
+ "normalized": false,
1399
+ "special": true
1400
+ },
1401
+ {
1402
+ "id": 50185,
1403
+ "content": "<|pad_token[137]|>",
1404
+ "single_word": false,
1405
+ "lstrip": false,
1406
+ "rstrip": false,
1407
+ "normalized": false,
1408
+ "special": true
1409
+ },
1410
+ {
1411
+ "id": 50186,
1412
+ "content": "<|pad_token[138]|>",
1413
+ "single_word": false,
1414
+ "lstrip": false,
1415
+ "rstrip": false,
1416
+ "normalized": false,
1417
+ "special": true
1418
+ },
1419
+ {
1420
+ "id": 50187,
1421
+ "content": "<|pad_token[139]|>",
1422
+ "single_word": false,
1423
+ "lstrip": false,
1424
+ "rstrip": false,
1425
+ "normalized": false,
1426
+ "special": true
1427
+ },
1428
+ {
1429
+ "id": 50188,
1430
+ "content": "<|pad_token[140]|>",
1431
+ "single_word": false,
1432
+ "lstrip": false,
1433
+ "rstrip": false,
1434
+ "normalized": false,
1435
+ "special": true
1436
+ },
1437
+ {
1438
+ "id": 50189,
1439
+ "content": "<|pad_token[141]|>",
1440
+ "single_word": false,
1441
+ "lstrip": false,
1442
+ "rstrip": false,
1443
+ "normalized": false,
1444
+ "special": true
1445
+ },
1446
+ {
1447
+ "id": 50190,
1448
+ "content": "<|pad_token[142]|>",
1449
+ "single_word": false,
1450
+ "lstrip": false,
1451
+ "rstrip": false,
1452
+ "normalized": false,
1453
+ "special": true
1454
+ },
1455
+ {
1456
+ "id": 50191,
1457
+ "content": "<|pad_token[143]|>",
1458
+ "single_word": false,
1459
+ "lstrip": false,
1460
+ "rstrip": false,
1461
+ "normalized": false,
1462
+ "special": true
1463
+ },
1464
+ {
1465
+ "id": 50192,
1466
+ "content": "<|pad_token[144]|>",
1467
+ "single_word": false,
1468
+ "lstrip": false,
1469
+ "rstrip": false,
1470
+ "normalized": false,
1471
+ "special": true
1472
+ },
1473
+ {
1474
+ "id": 50193,
1475
+ "content": "<|pad_token[145]|>",
1476
+ "single_word": false,
1477
+ "lstrip": false,
1478
+ "rstrip": false,
1479
+ "normalized": false,
1480
+ "special": true
1481
+ },
1482
+ {
1483
+ "id": 50194,
1484
+ "content": "<|pad_token[146]|>",
1485
+ "single_word": false,
1486
+ "lstrip": false,
1487
+ "rstrip": false,
1488
+ "normalized": false,
1489
+ "special": true
1490
+ },
1491
+ {
1492
+ "id": 50195,
1493
+ "content": "<|pad_token[147]|>",
1494
+ "single_word": false,
1495
+ "lstrip": false,
1496
+ "rstrip": false,
1497
+ "normalized": false,
1498
+ "special": true
1499
+ },
1500
+ {
1501
+ "id": 50196,
1502
+ "content": "<|pad_token[148]|>",
1503
+ "single_word": false,
1504
+ "lstrip": false,
1505
+ "rstrip": false,
1506
+ "normalized": false,
1507
+ "special": true
1508
+ },
1509
+ {
1510
+ "id": 50197,
1511
+ "content": "<|pad_token[149]|>",
1512
+ "single_word": false,
1513
+ "lstrip": false,
1514
+ "rstrip": false,
1515
+ "normalized": false,
1516
+ "special": true
1517
+ },
1518
+ {
1519
+ "id": 50198,
1520
+ "content": "<|pad_token[150]|>",
1521
+ "single_word": false,
1522
+ "lstrip": false,
1523
+ "rstrip": false,
1524
+ "normalized": false,
1525
+ "special": true
1526
+ },
1527
+ {
1528
+ "id": 50199,
1529
+ "content": "<|pad_token[151]|>",
1530
+ "single_word": false,
1531
+ "lstrip": false,
1532
+ "rstrip": false,
1533
+ "normalized": false,
1534
+ "special": true
1535
+ },
1536
+ {
1537
+ "id": 50200,
1538
+ "content": "<|pad_token[152]|>",
1539
+ "single_word": false,
1540
+ "lstrip": false,
1541
+ "rstrip": false,
1542
+ "normalized": false,
1543
+ "special": true
1544
+ },
1545
+ {
1546
+ "id": 50201,
1547
+ "content": "<|pad_token[153]|>",
1548
+ "single_word": false,
1549
+ "lstrip": false,
1550
+ "rstrip": false,
1551
+ "normalized": false,
1552
+ "special": true
1553
+ },
1554
+ {
1555
+ "id": 50202,
1556
+ "content": "<|pad_token[154]|>",
1557
+ "single_word": false,
1558
+ "lstrip": false,
1559
+ "rstrip": false,
1560
+ "normalized": false,
1561
+ "special": true
1562
+ },
1563
+ {
1564
+ "id": 50203,
1565
+ "content": "<|pad_token[155]|>",
1566
+ "single_word": false,
1567
+ "lstrip": false,
1568
+ "rstrip": false,
1569
+ "normalized": false,
1570
+ "special": true
1571
+ },
1572
+ {
1573
+ "id": 50204,
1574
+ "content": "<|pad_token[156]|>",
1575
+ "single_word": false,
1576
+ "lstrip": false,
1577
+ "rstrip": false,
1578
+ "normalized": false,
1579
+ "special": true
1580
+ },
1581
+ {
1582
+ "id": 50205,
1583
+ "content": "<|pad_token[157]|>",
1584
+ "single_word": false,
1585
+ "lstrip": false,
1586
+ "rstrip": false,
1587
+ "normalized": false,
1588
+ "special": true
1589
+ },
1590
+ {
1591
+ "id": 50206,
1592
+ "content": "<|pad_token[158]|>",
1593
+ "single_word": false,
1594
+ "lstrip": false,
1595
+ "rstrip": false,
1596
+ "normalized": false,
1597
+ "special": true
1598
+ },
1599
+ {
1600
+ "id": 50207,
1601
+ "content": "<|pad_token[159]|>",
1602
+ "single_word": false,
1603
+ "lstrip": false,
1604
+ "rstrip": false,
1605
+ "normalized": false,
1606
+ "special": true
1607
+ },
1608
+ {
1609
+ "id": 50208,
1610
+ "content": "<|pad_token[160]|>",
1611
+ "single_word": false,
1612
+ "lstrip": false,
1613
+ "rstrip": false,
1614
+ "normalized": false,
1615
+ "special": true
1616
+ },
1617
+ {
1618
+ "id": 50209,
1619
+ "content": "<|pad_token[161]|>",
1620
+ "single_word": false,
1621
+ "lstrip": false,
1622
+ "rstrip": false,
1623
+ "normalized": false,
1624
+ "special": true
1625
+ },
1626
+ {
1627
+ "id": 50210,
1628
+ "content": "<|pad_token[162]|>",
1629
+ "single_word": false,
1630
+ "lstrip": false,
1631
+ "rstrip": false,
1632
+ "normalized": false,
1633
+ "special": true
1634
+ },
1635
+ {
1636
+ "id": 50211,
1637
+ "content": "<|pad_token[163]|>",
1638
+ "single_word": false,
1639
+ "lstrip": false,
1640
+ "rstrip": false,
1641
+ "normalized": false,
1642
+ "special": true
1643
+ },
1644
+ {
1645
+ "id": 50212,
1646
+ "content": "<|pad_token[164]|>",
1647
+ "single_word": false,
1648
+ "lstrip": false,
1649
+ "rstrip": false,
1650
+ "normalized": false,
1651
+ "special": true
1652
+ },
1653
+ {
1654
+ "id": 50213,
1655
+ "content": "<|pad_token[165]|>",
1656
+ "single_word": false,
1657
+ "lstrip": false,
1658
+ "rstrip": false,
1659
+ "normalized": false,
1660
+ "special": true
1661
+ },
1662
+ {
1663
+ "id": 50214,
1664
+ "content": "<|pad_token[166]|>",
1665
+ "single_word": false,
1666
+ "lstrip": false,
1667
+ "rstrip": false,
1668
+ "normalized": false,
1669
+ "special": true
1670
+ },
1671
+ {
1672
+ "id": 50215,
1673
+ "content": "<|pad_token[167]|>",
1674
+ "single_word": false,
1675
+ "lstrip": false,
1676
+ "rstrip": false,
1677
+ "normalized": false,
1678
+ "special": true
1679
+ },
1680
+ {
1681
+ "id": 50216,
1682
+ "content": "<|pad_token[168]|>",
1683
+ "single_word": false,
1684
+ "lstrip": false,
1685
+ "rstrip": false,
1686
+ "normalized": false,
1687
+ "special": true
1688
+ },
1689
+ {
1690
+ "id": 50217,
1691
+ "content": "<|pad_token[169]|>",
1692
+ "single_word": false,
1693
+ "lstrip": false,
1694
+ "rstrip": false,
1695
+ "normalized": false,
1696
+ "special": true
1697
+ },
1698
+ {
1699
+ "id": 50218,
1700
+ "content": "<|pad_token[170]|>",
1701
+ "single_word": false,
1702
+ "lstrip": false,
1703
+ "rstrip": false,
1704
+ "normalized": false,
1705
+ "special": true
1706
+ },
1707
+ {
1708
+ "id": 50219,
1709
+ "content": "<|pad_token[171]|>",
1710
+ "single_word": false,
1711
+ "lstrip": false,
1712
+ "rstrip": false,
1713
+ "normalized": false,
1714
+ "special": true
1715
+ },
1716
+ {
1717
+ "id": 50220,
1718
+ "content": "<|pad_token[172]|>",
1719
+ "single_word": false,
1720
+ "lstrip": false,
1721
+ "rstrip": false,
1722
+ "normalized": false,
1723
+ "special": true
1724
+ },
1725
+ {
1726
+ "id": 50221,
1727
+ "content": "<|pad_token[173]|>",
1728
+ "single_word": false,
1729
+ "lstrip": false,
1730
+ "rstrip": false,
1731
+ "normalized": false,
1732
+ "special": true
1733
+ },
1734
+ {
1735
+ "id": 50222,
1736
+ "content": "<|pad_token[174]|>",
1737
+ "single_word": false,
1738
+ "lstrip": false,
1739
+ "rstrip": false,
1740
+ "normalized": false,
1741
+ "special": true
1742
+ },
1743
+ {
1744
+ "id": 50223,
1745
+ "content": "<|pad_token[175]|>",
1746
+ "single_word": false,
1747
+ "lstrip": false,
1748
+ "rstrip": false,
1749
+ "normalized": false,
1750
+ "special": true
1751
+ },
1752
+ {
1753
+ "id": 50224,
1754
+ "content": "<|pad_token[176]|>",
1755
+ "single_word": false,
1756
+ "lstrip": false,
1757
+ "rstrip": false,
1758
+ "normalized": false,
1759
+ "special": true
1760
+ },
1761
+ {
1762
+ "id": 50225,
1763
+ "content": "<|pad_token[177]|>",
1764
+ "single_word": false,
1765
+ "lstrip": false,
1766
+ "rstrip": false,
1767
+ "normalized": false,
1768
+ "special": true
1769
+ },
1770
+ {
1771
+ "id": 50226,
1772
+ "content": "<|pad_token[178]|>",
1773
+ "single_word": false,
1774
+ "lstrip": false,
1775
+ "rstrip": false,
1776
+ "normalized": false,
1777
+ "special": true
1778
+ },
1779
+ {
1780
+ "id": 50227,
1781
+ "content": "<|pad_token[179]|>",
1782
+ "single_word": false,
1783
+ "lstrip": false,
1784
+ "rstrip": false,
1785
+ "normalized": false,
1786
+ "special": true
1787
+ },
1788
+ {
1789
+ "id": 50228,
1790
+ "content": "<|pad_token[180]|>",
1791
+ "single_word": false,
1792
+ "lstrip": false,
1793
+ "rstrip": false,
1794
+ "normalized": false,
1795
+ "special": true
1796
+ },
1797
+ {
1798
+ "id": 50229,
1799
+ "content": "<|pad_token[181]|>",
1800
+ "single_word": false,
1801
+ "lstrip": false,
1802
+ "rstrip": false,
1803
+ "normalized": false,
1804
+ "special": true
1805
+ },
1806
+ {
1807
+ "id": 50230,
1808
+ "content": "<|pad_token[182]|>",
1809
+ "single_word": false,
1810
+ "lstrip": false,
1811
+ "rstrip": false,
1812
+ "normalized": false,
1813
+ "special": true
1814
+ },
1815
+ {
1816
+ "id": 50231,
1817
+ "content": "<|pad_token[183]|>",
1818
+ "single_word": false,
1819
+ "lstrip": false,
1820
+ "rstrip": false,
1821
+ "normalized": false,
1822
+ "special": true
1823
+ },
1824
+ {
1825
+ "id": 50232,
1826
+ "content": "<|pad_token[184]|>",
1827
+ "single_word": false,
1828
+ "lstrip": false,
1829
+ "rstrip": false,
1830
+ "normalized": false,
1831
+ "special": true
1832
+ },
1833
+ {
1834
+ "id": 50233,
1835
+ "content": "<|pad_token[185]|>",
1836
+ "single_word": false,
1837
+ "lstrip": false,
1838
+ "rstrip": false,
1839
+ "normalized": false,
1840
+ "special": true
1841
+ },
1842
+ {
1843
+ "id": 50234,
1844
+ "content": "<|pad_token[186]|>",
1845
+ "single_word": false,
1846
+ "lstrip": false,
1847
+ "rstrip": false,
1848
+ "normalized": false,
1849
+ "special": true
1850
+ },
1851
+ {
1852
+ "id": 50235,
1853
+ "content": "<|pad_token[187]|>",
1854
+ "single_word": false,
1855
+ "lstrip": false,
1856
+ "rstrip": false,
1857
+ "normalized": false,
1858
+ "special": true
1859
+ },
1860
+ {
1861
+ "id": 50236,
1862
+ "content": "<|pad_token[188]|>",
1863
+ "single_word": false,
1864
+ "lstrip": false,
1865
+ "rstrip": false,
1866
+ "normalized": false,
1867
+ "special": true
1868
+ },
1869
+ {
1870
+ "id": 50237,
1871
+ "content": "<|pad_token[189]|>",
1872
+ "single_word": false,
1873
+ "lstrip": false,
1874
+ "rstrip": false,
1875
+ "normalized": false,
1876
+ "special": true
1877
+ },
1878
+ {
1879
+ "id": 50238,
1880
+ "content": "<|pad_token[190]|>",
1881
+ "single_word": false,
1882
+ "lstrip": false,
1883
+ "rstrip": false,
1884
+ "normalized": false,
1885
+ "special": true
1886
+ },
1887
+ {
1888
+ "id": 50239,
1889
+ "content": "<|pad_token[191]|>",
1890
+ "single_word": false,
1891
+ "lstrip": false,
1892
+ "rstrip": false,
1893
+ "normalized": false,
1894
+ "special": true
1895
+ },
1896
+ {
1897
+ "id": 50240,
1898
+ "content": "<|pad_token[192]|>",
1899
+ "single_word": false,
1900
+ "lstrip": false,
1901
+ "rstrip": false,
1902
+ "normalized": false,
1903
+ "special": true
1904
+ },
1905
+ {
1906
+ "id": 50241,
1907
+ "content": "<|pad_token[193]|>",
1908
+ "single_word": false,
1909
+ "lstrip": false,
1910
+ "rstrip": false,
1911
+ "normalized": false,
1912
+ "special": true
1913
+ },
1914
+ {
1915
+ "id": 50242,
1916
+ "content": "<|pad_token[194]|>",
1917
+ "single_word": false,
1918
+ "lstrip": false,
1919
+ "rstrip": false,
1920
+ "normalized": false,
1921
+ "special": true
1922
+ },
1923
+ {
1924
+ "id": 50243,
1925
+ "content": "<|pad_token[195]|>",
1926
+ "single_word": false,
1927
+ "lstrip": false,
1928
+ "rstrip": false,
1929
+ "normalized": false,
1930
+ "special": true
1931
+ },
1932
+ {
1933
+ "id": 50244,
1934
+ "content": "<|pad_token[196]|>",
1935
+ "single_word": false,
1936
+ "lstrip": false,
1937
+ "rstrip": false,
1938
+ "normalized": false,
1939
+ "special": true
1940
+ },
1941
+ {
1942
+ "id": 50245,
1943
+ "content": "<|pad_token[197]|>",
1944
+ "single_word": false,
1945
+ "lstrip": false,
1946
+ "rstrip": false,
1947
+ "normalized": false,
1948
+ "special": true
1949
+ },
1950
+ {
1951
+ "id": 50246,
1952
+ "content": "<|pad_token[198]|>",
1953
+ "single_word": false,
1954
+ "lstrip": false,
1955
+ "rstrip": false,
1956
+ "normalized": false,
1957
+ "special": true
1958
+ },
1959
+ {
1960
+ "id": 50247,
1961
+ "content": "<|pad_token[199]|>",
1962
+ "single_word": false,
1963
+ "lstrip": false,
1964
+ "rstrip": false,
1965
+ "normalized": false,
1966
+ "special": true
1967
+ },
1968
+ {
1969
+ "id": 50248,
1970
+ "content": "<|pad_token[200]|>",
1971
+ "single_word": false,
1972
+ "lstrip": false,
1973
+ "rstrip": false,
1974
+ "normalized": false,
1975
+ "special": true
1976
+ },
1977
+ {
1978
+ "id": 50249,
1979
+ "content": "<|pad_token[201]|>",
1980
+ "single_word": false,
1981
+ "lstrip": false,
1982
+ "rstrip": false,
1983
+ "normalized": false,
1984
+ "special": true
1985
+ },
1986
+ {
1987
+ "id": 50250,
1988
+ "content": "<|pad_token[202]|>",
1989
+ "single_word": false,
1990
+ "lstrip": false,
1991
+ "rstrip": false,
1992
+ "normalized": false,
1993
+ "special": true
1994
+ },
1995
+ {
1996
+ "id": 50251,
1997
+ "content": "<|pad_token[203]|>",
1998
+ "single_word": false,
1999
+ "lstrip": false,
2000
+ "rstrip": false,
2001
+ "normalized": false,
2002
+ "special": true
2003
+ },
2004
+ {
2005
+ "id": 50252,
2006
+ "content": "<|pad_token[204]|>",
2007
+ "single_word": false,
2008
+ "lstrip": false,
2009
+ "rstrip": false,
2010
+ "normalized": false,
2011
+ "special": true
2012
+ },
2013
+ {
2014
+ "id": 50253,
2015
+ "content": "<|pad_token[205]|>",
2016
+ "single_word": false,
2017
+ "lstrip": false,
2018
+ "rstrip": false,
2019
+ "normalized": false,
2020
+ "special": true
2021
+ },
2022
+ {
2023
+ "id": 50254,
2024
+ "content": "<|pad_token[206]|>",
2025
+ "single_word": false,
2026
+ "lstrip": false,
2027
+ "rstrip": false,
2028
+ "normalized": false,
2029
+ "special": true
2030
+ },
2031
+ {
2032
+ "id": 50255,
2033
+ "content": "<|pad_token[207]|>",
2034
+ "single_word": false,
2035
+ "lstrip": false,
2036
+ "rstrip": false,
2037
+ "normalized": false,
2038
+ "special": true
2039
+ },
2040
+ {
2041
+ "id": 50256,
2042
+ "content": "<|pad_token[208]|>",
2043
+ "single_word": false,
2044
+ "lstrip": false,
2045
+ "rstrip": false,
2046
+ "normalized": false,
2047
+ "special": true
2048
+ },
2049
+ {
2050
+ "id": 50257,
2051
+ "content": "<|pad_token[209]|>",
2052
+ "single_word": false,
2053
+ "lstrip": false,
2054
+ "rstrip": false,
2055
+ "normalized": false,
2056
+ "special": true
2057
+ },
2058
+ {
2059
+ "id": 50258,
2060
+ "content": "<|pad_token[210]|>",
2061
+ "single_word": false,
2062
+ "lstrip": false,
2063
+ "rstrip": false,
2064
+ "normalized": false,
2065
+ "special": true
2066
+ },
2067
+ {
2068
+ "id": 50259,
2069
+ "content": "<|pad_token[211]|>",
2070
+ "single_word": false,
2071
+ "lstrip": false,
2072
+ "rstrip": false,
2073
+ "normalized": false,
2074
+ "special": true
2075
+ },
2076
+ {
2077
+ "id": 50260,
2078
+ "content": "<|pad_token[212]|>",
2079
+ "single_word": false,
2080
+ "lstrip": false,
2081
+ "rstrip": false,
2082
+ "normalized": false,
2083
+ "special": true
2084
+ },
2085
+ {
2086
+ "id": 50261,
2087
+ "content": "<|pad_token[213]|>",
2088
+ "single_word": false,
2089
+ "lstrip": false,
2090
+ "rstrip": false,
2091
+ "normalized": false,
2092
+ "special": true
2093
+ },
2094
+ {
2095
+ "id": 50262,
2096
+ "content": "<|pad_token[214]|>",
2097
+ "single_word": false,
2098
+ "lstrip": false,
2099
+ "rstrip": false,
2100
+ "normalized": false,
2101
+ "special": true
2102
+ },
2103
+ {
2104
+ "id": 50263,
2105
+ "content": "<|pad_token[215]|>",
2106
+ "single_word": false,
2107
+ "lstrip": false,
2108
+ "rstrip": false,
2109
+ "normalized": false,
2110
+ "special": true
2111
+ },
2112
+ {
2113
+ "id": 50264,
2114
+ "content": "<|pad_token[216]|>",
2115
+ "single_word": false,
2116
+ "lstrip": false,
2117
+ "rstrip": false,
2118
+ "normalized": false,
2119
+ "special": true
2120
+ },
2121
+ {
2122
+ "id": 50265,
2123
+ "content": "<|pad_token[217]|>",
2124
+ "single_word": false,
2125
+ "lstrip": false,
2126
+ "rstrip": false,
2127
+ "normalized": false,
2128
+ "special": true
2129
+ },
2130
+ {
2131
+ "id": 50266,
2132
+ "content": "<|pad_token[218]|>",
2133
+ "single_word": false,
2134
+ "lstrip": false,
2135
+ "rstrip": false,
2136
+ "normalized": false,
2137
+ "special": true
2138
+ },
2139
+ {
2140
+ "id": 50267,
2141
+ "content": "<|pad_token[219]|>",
2142
+ "single_word": false,
2143
+ "lstrip": false,
2144
+ "rstrip": false,
2145
+ "normalized": false,
2146
+ "special": true
2147
+ },
2148
+ {
2149
+ "id": 50268,
2150
+ "content": "<|pad_token[220]|>",
2151
+ "single_word": false,
2152
+ "lstrip": false,
2153
+ "rstrip": false,
2154
+ "normalized": false,
2155
+ "special": true
2156
+ },
2157
+ {
2158
+ "id": 50269,
2159
+ "content": "<|pad_token[221]|>",
2160
+ "single_word": false,
2161
+ "lstrip": false,
2162
+ "rstrip": false,
2163
+ "normalized": false,
2164
+ "special": true
2165
+ },
2166
+ {
2167
+ "id": 50270,
2168
+ "content": "<|pad_token[222]|>",
2169
+ "single_word": false,
2170
+ "lstrip": false,
2171
+ "rstrip": false,
2172
+ "normalized": false,
2173
+ "special": true
2174
+ },
2175
+ {
2176
+ "id": 50271,
2177
+ "content": "<|pad_token[223]|>",
2178
+ "single_word": false,
2179
+ "lstrip": false,
2180
+ "rstrip": false,
2181
+ "normalized": false,
2182
+ "special": true
2183
+ },
2184
+ {
2185
+ "id": 50272,
2186
+ "content": "<|pad_token[224]|>",
2187
+ "single_word": false,
2188
+ "lstrip": false,
2189
+ "rstrip": false,
2190
+ "normalized": false,
2191
+ "special": true
2192
+ },
2193
+ {
2194
+ "id": 50273,
2195
+ "content": "<|pad_token[225]|>",
2196
+ "single_word": false,
2197
+ "lstrip": false,
2198
+ "rstrip": false,
2199
+ "normalized": false,
2200
+ "special": true
2201
+ },
2202
+ {
2203
+ "id": 50274,
2204
+ "content": "<|pad_token[226]|>",
2205
+ "single_word": false,
2206
+ "lstrip": false,
2207
+ "rstrip": false,
2208
+ "normalized": false,
2209
+ "special": true
2210
+ },
2211
+ {
2212
+ "id": 50275,
2213
+ "content": "<|pad_token[227]|>",
2214
+ "single_word": false,
2215
+ "lstrip": false,
2216
+ "rstrip": false,
2217
+ "normalized": false,
2218
+ "special": true
2219
+ },
2220
+ {
2221
+ "id": 50276,
2222
+ "content": "<|pad_token[228]|>",
2223
+ "single_word": false,
2224
+ "lstrip": false,
2225
+ "rstrip": false,
2226
+ "normalized": false,
2227
+ "special": true
2228
+ },
2229
+ {
2230
+ "id": 50277,
2231
+ "content": "<|pad_token[229]|>",
2232
+ "single_word": false,
2233
+ "lstrip": false,
2234
+ "rstrip": false,
2235
+ "normalized": false,
2236
+ "special": true
2237
+ },
2238
+ {
2239
+ "id": 50278,
2240
+ "content": "<|pad_token[230]|>",
2241
+ "single_word": false,
2242
+ "lstrip": false,
2243
+ "rstrip": false,
2244
+ "normalized": false,
2245
+ "special": true
2246
+ },
2247
+ {
2248
+ "id": 50279,
2249
+ "content": "<|pad_token[231]|>",
2250
+ "single_word": false,
2251
+ "lstrip": false,
2252
+ "rstrip": false,
2253
+ "normalized": false,
2254
+ "special": true
2255
+ },
2256
+ {
2257
+ "id": 50280,
2258
+ "content": "<|pad_token[232]|>",
2259
+ "single_word": false,
2260
+ "lstrip": false,
2261
+ "rstrip": false,
2262
+ "normalized": false,
2263
+ "special": true
2264
+ },
2265
+ {
2266
+ "id": 50281,
2267
+ "content": "<|pad_token[233]|>",
2268
+ "single_word": false,
2269
+ "lstrip": false,
2270
+ "rstrip": false,
2271
+ "normalized": false,
2272
+ "special": true
2273
+ },
2274
+ {
2275
+ "id": 50282,
2276
+ "content": "<|pad_token[234]|>",
2277
+ "single_word": false,
2278
+ "lstrip": false,
2279
+ "rstrip": false,
2280
+ "normalized": false,
2281
+ "special": true
2282
+ },
2283
+ {
2284
+ "id": 50283,
2285
+ "content": "<|pad_token[235]|>",
2286
+ "single_word": false,
2287
+ "lstrip": false,
2288
+ "rstrip": false,
2289
+ "normalized": false,
2290
+ "special": true
2291
+ },
2292
+ {
2293
+ "id": 50284,
2294
+ "content": "<|pad_token[236]|>",
2295
+ "single_word": false,
2296
+ "lstrip": false,
2297
+ "rstrip": false,
2298
+ "normalized": false,
2299
+ "special": true
2300
+ },
2301
+ {
2302
+ "id": 50285,
2303
+ "content": "<|pad_token[237]|>",
2304
+ "single_word": false,
2305
+ "lstrip": false,
2306
+ "rstrip": false,
2307
+ "normalized": false,
2308
+ "special": true
2309
+ },
2310
+ {
2311
+ "id": 50286,
2312
+ "content": "<|pad_token[238]|>",
2313
+ "single_word": false,
2314
+ "lstrip": false,
2315
+ "rstrip": false,
2316
+ "normalized": false,
2317
+ "special": true
2318
+ },
2319
+ {
2320
+ "id": 50287,
2321
+ "content": "<|pad_token[239]|>",
2322
+ "single_word": false,
2323
+ "lstrip": false,
2324
+ "rstrip": false,
2325
+ "normalized": false,
2326
+ "special": true
2327
+ },
2328
+ {
2329
+ "id": 50288,
2330
+ "content": "<|pad_token[240]|>",
2331
+ "single_word": false,
2332
+ "lstrip": false,
2333
+ "rstrip": false,
2334
+ "normalized": false,
2335
+ "special": true
2336
+ },
2337
+ {
2338
+ "id": 50289,
2339
+ "content": "<|pad_token[241]|>",
2340
+ "single_word": false,
2341
+ "lstrip": false,
2342
+ "rstrip": false,
2343
+ "normalized": false,
2344
+ "special": true
2345
+ },
2346
+ {
2347
+ "id": 50290,
2348
+ "content": "<|pad_token[242]|>",
2349
+ "single_word": false,
2350
+ "lstrip": false,
2351
+ "rstrip": false,
2352
+ "normalized": false,
2353
+ "special": true
2354
+ },
2355
+ {
2356
+ "id": 50291,
2357
+ "content": "<|pad_token[243]|>",
2358
+ "single_word": false,
2359
+ "lstrip": false,
2360
+ "rstrip": false,
2361
+ "normalized": false,
2362
+ "special": true
2363
+ },
2364
+ {
2365
+ "id": 50292,
2366
+ "content": "<|pad_token[244]|>",
2367
+ "single_word": false,
2368
+ "lstrip": false,
2369
+ "rstrip": false,
2370
+ "normalized": false,
2371
+ "special": true
2372
+ },
2373
+ {
2374
+ "id": 50293,
2375
+ "content": "<|pad_token[245]|>",
2376
+ "single_word": false,
2377
+ "lstrip": false,
2378
+ "rstrip": false,
2379
+ "normalized": false,
2380
+ "special": true
2381
+ },
2382
+ {
2383
+ "id": 50294,
2384
+ "content": "<|pad_token[246]|>",
2385
+ "single_word": false,
2386
+ "lstrip": false,
2387
+ "rstrip": false,
2388
+ "normalized": false,
2389
+ "special": true
2390
+ },
2391
+ {
2392
+ "id": 50295,
2393
+ "content": "<|pad_token[247]|>",
2394
+ "single_word": false,
2395
+ "lstrip": false,
2396
+ "rstrip": false,
2397
+ "normalized": false,
2398
+ "special": true
2399
+ },
2400
+ {
2401
+ "id": 50296,
2402
+ "content": "<|pad_token[248]|>",
2403
+ "single_word": false,
2404
+ "lstrip": false,
2405
+ "rstrip": false,
2406
+ "normalized": false,
2407
+ "special": true
2408
+ },
2409
+ {
2410
+ "id": 50297,
2411
+ "content": "<|pad_token[249]|>",
2412
+ "single_word": false,
2413
+ "lstrip": false,
2414
+ "rstrip": false,
2415
+ "normalized": false,
2416
+ "special": true
2417
+ },
2418
+ {
2419
+ "id": 50298,
2420
+ "content": "<|pad_token[250]|>",
2421
+ "single_word": false,
2422
+ "lstrip": false,
2423
+ "rstrip": false,
2424
+ "normalized": false,
2425
+ "special": true
2426
+ },
2427
+ {
2428
+ "id": 50299,
2429
+ "content": "<|pad_token[251]|>",
2430
+ "single_word": false,
2431
+ "lstrip": false,
2432
+ "rstrip": false,
2433
+ "normalized": false,
2434
+ "special": true
2435
+ },
2436
+ {
2437
+ "id": 50300,
2438
+ "content": "<|pad_token[252]|>",
2439
+ "single_word": false,
2440
+ "lstrip": false,
2441
+ "rstrip": false,
2442
+ "normalized": false,
2443
+ "special": true
2444
+ },
2445
+ {
2446
+ "id": 50301,
2447
+ "content": "<|pad_token[253]|>",
2448
+ "single_word": false,
2449
+ "lstrip": false,
2450
+ "rstrip": false,
2451
+ "normalized": false,
2452
+ "special": true
2453
+ },
2454
+ {
2455
+ "id": 50302,
2456
+ "content": "<|pad_token[254]|>",
2457
+ "single_word": false,
2458
+ "lstrip": false,
2459
+ "rstrip": false,
2460
+ "normalized": false,
2461
+ "special": true
2462
+ },
2463
+ {
2464
+ "id": 50303,
2465
+ "content": "<|pad_token[255]|>",
2466
+ "single_word": false,
2467
+ "lstrip": false,
2468
+ "rstrip": false,
2469
+ "normalized": false,
2470
+ "special": true
2471
  }
2472
  ],
2473
  "normalizer": null,
last-checkpoint/tokenizer_config.json CHANGED
@@ -3,8 +3,8 @@
3
  "bos_token": "<|begin_of_text|>",
4
  "clean_up_tokenization_spaces": true,
5
  "eos_token": "<|end_of_text|>",
 
6
  "is_local": true,
7
- "local_files_only": false,
8
  "model_input_names": [
9
  "input_ids",
10
  "attention_mask"
@@ -158,6 +158,2054 @@
158
  "rstrip": false,
159
  "normalized": false,
160
  "special": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
161
  }
162
  }
163
  }
 
3
  "bos_token": "<|begin_of_text|>",
4
  "clean_up_tokenization_spaces": true,
5
  "eos_token": "<|end_of_text|>",
6
+ "extra_special_tokens": [],
7
  "is_local": true,
 
8
  "model_input_names": [
9
  "input_ids",
10
  "attention_mask"
 
158
  "rstrip": false,
159
  "normalized": false,
160
  "special": true
161
+ },
162
+ "50048": {
163
+ "content": "<|pad_token[0]|>",
164
+ "single_word": false,
165
+ "lstrip": false,
166
+ "rstrip": false,
167
+ "normalized": false,
168
+ "special": true
169
+ },
170
+ "50049": {
171
+ "content": "<|pad_token[1]|>",
172
+ "single_word": false,
173
+ "lstrip": false,
174
+ "rstrip": false,
175
+ "normalized": false,
176
+ "special": true
177
+ },
178
+ "50050": {
179
+ "content": "<|pad_token[2]|>",
180
+ "single_word": false,
181
+ "lstrip": false,
182
+ "rstrip": false,
183
+ "normalized": false,
184
+ "special": true
185
+ },
186
+ "50051": {
187
+ "content": "<|pad_token[3]|>",
188
+ "single_word": false,
189
+ "lstrip": false,
190
+ "rstrip": false,
191
+ "normalized": false,
192
+ "special": true
193
+ },
194
+ "50052": {
195
+ "content": "<|pad_token[4]|>",
196
+ "single_word": false,
197
+ "lstrip": false,
198
+ "rstrip": false,
199
+ "normalized": false,
200
+ "special": true
201
+ },
202
+ "50053": {
203
+ "content": "<|pad_token[5]|>",
204
+ "single_word": false,
205
+ "lstrip": false,
206
+ "rstrip": false,
207
+ "normalized": false,
208
+ "special": true
209
+ },
210
+ "50054": {
211
+ "content": "<|pad_token[6]|>",
212
+ "single_word": false,
213
+ "lstrip": false,
214
+ "rstrip": false,
215
+ "normalized": false,
216
+ "special": true
217
+ },
218
+ "50055": {
219
+ "content": "<|pad_token[7]|>",
220
+ "single_word": false,
221
+ "lstrip": false,
222
+ "rstrip": false,
223
+ "normalized": false,
224
+ "special": true
225
+ },
226
+ "50056": {
227
+ "content": "<|pad_token[8]|>",
228
+ "single_word": false,
229
+ "lstrip": false,
230
+ "rstrip": false,
231
+ "normalized": false,
232
+ "special": true
233
+ },
234
+ "50057": {
235
+ "content": "<|pad_token[9]|>",
236
+ "single_word": false,
237
+ "lstrip": false,
238
+ "rstrip": false,
239
+ "normalized": false,
240
+ "special": true
241
+ },
242
+ "50058": {
243
+ "content": "<|pad_token[10]|>",
244
+ "single_word": false,
245
+ "lstrip": false,
246
+ "rstrip": false,
247
+ "normalized": false,
248
+ "special": true
249
+ },
250
+ "50059": {
251
+ "content": "<|pad_token[11]|>",
252
+ "single_word": false,
253
+ "lstrip": false,
254
+ "rstrip": false,
255
+ "normalized": false,
256
+ "special": true
257
+ },
258
+ "50060": {
259
+ "content": "<|pad_token[12]|>",
260
+ "single_word": false,
261
+ "lstrip": false,
262
+ "rstrip": false,
263
+ "normalized": false,
264
+ "special": true
265
+ },
266
+ "50061": {
267
+ "content": "<|pad_token[13]|>",
268
+ "single_word": false,
269
+ "lstrip": false,
270
+ "rstrip": false,
271
+ "normalized": false,
272
+ "special": true
273
+ },
274
+ "50062": {
275
+ "content": "<|pad_token[14]|>",
276
+ "single_word": false,
277
+ "lstrip": false,
278
+ "rstrip": false,
279
+ "normalized": false,
280
+ "special": true
281
+ },
282
+ "50063": {
283
+ "content": "<|pad_token[15]|>",
284
+ "single_word": false,
285
+ "lstrip": false,
286
+ "rstrip": false,
287
+ "normalized": false,
288
+ "special": true
289
+ },
290
+ "50064": {
291
+ "content": "<|pad_token[16]|>",
292
+ "single_word": false,
293
+ "lstrip": false,
294
+ "rstrip": false,
295
+ "normalized": false,
296
+ "special": true
297
+ },
298
+ "50065": {
299
+ "content": "<|pad_token[17]|>",
300
+ "single_word": false,
301
+ "lstrip": false,
302
+ "rstrip": false,
303
+ "normalized": false,
304
+ "special": true
305
+ },
306
+ "50066": {
307
+ "content": "<|pad_token[18]|>",
308
+ "single_word": false,
309
+ "lstrip": false,
310
+ "rstrip": false,
311
+ "normalized": false,
312
+ "special": true
313
+ },
314
+ "50067": {
315
+ "content": "<|pad_token[19]|>",
316
+ "single_word": false,
317
+ "lstrip": false,
318
+ "rstrip": false,
319
+ "normalized": false,
320
+ "special": true
321
+ },
322
+ "50068": {
323
+ "content": "<|pad_token[20]|>",
324
+ "single_word": false,
325
+ "lstrip": false,
326
+ "rstrip": false,
327
+ "normalized": false,
328
+ "special": true
329
+ },
330
+ "50069": {
331
+ "content": "<|pad_token[21]|>",
332
+ "single_word": false,
333
+ "lstrip": false,
334
+ "rstrip": false,
335
+ "normalized": false,
336
+ "special": true
337
+ },
338
+ "50070": {
339
+ "content": "<|pad_token[22]|>",
340
+ "single_word": false,
341
+ "lstrip": false,
342
+ "rstrip": false,
343
+ "normalized": false,
344
+ "special": true
345
+ },
346
+ "50071": {
347
+ "content": "<|pad_token[23]|>",
348
+ "single_word": false,
349
+ "lstrip": false,
350
+ "rstrip": false,
351
+ "normalized": false,
352
+ "special": true
353
+ },
354
+ "50072": {
355
+ "content": "<|pad_token[24]|>",
356
+ "single_word": false,
357
+ "lstrip": false,
358
+ "rstrip": false,
359
+ "normalized": false,
360
+ "special": true
361
+ },
362
+ "50073": {
363
+ "content": "<|pad_token[25]|>",
364
+ "single_word": false,
365
+ "lstrip": false,
366
+ "rstrip": false,
367
+ "normalized": false,
368
+ "special": true
369
+ },
370
+ "50074": {
371
+ "content": "<|pad_token[26]|>",
372
+ "single_word": false,
373
+ "lstrip": false,
374
+ "rstrip": false,
375
+ "normalized": false,
376
+ "special": true
377
+ },
378
+ "50075": {
379
+ "content": "<|pad_token[27]|>",
380
+ "single_word": false,
381
+ "lstrip": false,
382
+ "rstrip": false,
383
+ "normalized": false,
384
+ "special": true
385
+ },
386
+ "50076": {
387
+ "content": "<|pad_token[28]|>",
388
+ "single_word": false,
389
+ "lstrip": false,
390
+ "rstrip": false,
391
+ "normalized": false,
392
+ "special": true
393
+ },
394
+ "50077": {
395
+ "content": "<|pad_token[29]|>",
396
+ "single_word": false,
397
+ "lstrip": false,
398
+ "rstrip": false,
399
+ "normalized": false,
400
+ "special": true
401
+ },
402
+ "50078": {
403
+ "content": "<|pad_token[30]|>",
404
+ "single_word": false,
405
+ "lstrip": false,
406
+ "rstrip": false,
407
+ "normalized": false,
408
+ "special": true
409
+ },
410
+ "50079": {
411
+ "content": "<|pad_token[31]|>",
412
+ "single_word": false,
413
+ "lstrip": false,
414
+ "rstrip": false,
415
+ "normalized": false,
416
+ "special": true
417
+ },
418
+ "50080": {
419
+ "content": "<|pad_token[32]|>",
420
+ "single_word": false,
421
+ "lstrip": false,
422
+ "rstrip": false,
423
+ "normalized": false,
424
+ "special": true
425
+ },
426
+ "50081": {
427
+ "content": "<|pad_token[33]|>",
428
+ "single_word": false,
429
+ "lstrip": false,
430
+ "rstrip": false,
431
+ "normalized": false,
432
+ "special": true
433
+ },
434
+ "50082": {
435
+ "content": "<|pad_token[34]|>",
436
+ "single_word": false,
437
+ "lstrip": false,
438
+ "rstrip": false,
439
+ "normalized": false,
440
+ "special": true
441
+ },
442
+ "50083": {
443
+ "content": "<|pad_token[35]|>",
444
+ "single_word": false,
445
+ "lstrip": false,
446
+ "rstrip": false,
447
+ "normalized": false,
448
+ "special": true
449
+ },
450
+ "50084": {
451
+ "content": "<|pad_token[36]|>",
452
+ "single_word": false,
453
+ "lstrip": false,
454
+ "rstrip": false,
455
+ "normalized": false,
456
+ "special": true
457
+ },
458
+ "50085": {
459
+ "content": "<|pad_token[37]|>",
460
+ "single_word": false,
461
+ "lstrip": false,
462
+ "rstrip": false,
463
+ "normalized": false,
464
+ "special": true
465
+ },
466
+ "50086": {
467
+ "content": "<|pad_token[38]|>",
468
+ "single_word": false,
469
+ "lstrip": false,
470
+ "rstrip": false,
471
+ "normalized": false,
472
+ "special": true
473
+ },
474
+ "50087": {
475
+ "content": "<|pad_token[39]|>",
476
+ "single_word": false,
477
+ "lstrip": false,
478
+ "rstrip": false,
479
+ "normalized": false,
480
+ "special": true
481
+ },
482
+ "50088": {
483
+ "content": "<|pad_token[40]|>",
484
+ "single_word": false,
485
+ "lstrip": false,
486
+ "rstrip": false,
487
+ "normalized": false,
488
+ "special": true
489
+ },
490
+ "50089": {
491
+ "content": "<|pad_token[41]|>",
492
+ "single_word": false,
493
+ "lstrip": false,
494
+ "rstrip": false,
495
+ "normalized": false,
496
+ "special": true
497
+ },
498
+ "50090": {
499
+ "content": "<|pad_token[42]|>",
500
+ "single_word": false,
501
+ "lstrip": false,
502
+ "rstrip": false,
503
+ "normalized": false,
504
+ "special": true
505
+ },
506
+ "50091": {
507
+ "content": "<|pad_token[43]|>",
508
+ "single_word": false,
509
+ "lstrip": false,
510
+ "rstrip": false,
511
+ "normalized": false,
512
+ "special": true
513
+ },
514
+ "50092": {
515
+ "content": "<|pad_token[44]|>",
516
+ "single_word": false,
517
+ "lstrip": false,
518
+ "rstrip": false,
519
+ "normalized": false,
520
+ "special": true
521
+ },
522
+ "50093": {
523
+ "content": "<|pad_token[45]|>",
524
+ "single_word": false,
525
+ "lstrip": false,
526
+ "rstrip": false,
527
+ "normalized": false,
528
+ "special": true
529
+ },
530
+ "50094": {
531
+ "content": "<|pad_token[46]|>",
532
+ "single_word": false,
533
+ "lstrip": false,
534
+ "rstrip": false,
535
+ "normalized": false,
536
+ "special": true
537
+ },
538
+ "50095": {
539
+ "content": "<|pad_token[47]|>",
540
+ "single_word": false,
541
+ "lstrip": false,
542
+ "rstrip": false,
543
+ "normalized": false,
544
+ "special": true
545
+ },
546
+ "50096": {
547
+ "content": "<|pad_token[48]|>",
548
+ "single_word": false,
549
+ "lstrip": false,
550
+ "rstrip": false,
551
+ "normalized": false,
552
+ "special": true
553
+ },
554
+ "50097": {
555
+ "content": "<|pad_token[49]|>",
556
+ "single_word": false,
557
+ "lstrip": false,
558
+ "rstrip": false,
559
+ "normalized": false,
560
+ "special": true
561
+ },
562
+ "50098": {
563
+ "content": "<|pad_token[50]|>",
564
+ "single_word": false,
565
+ "lstrip": false,
566
+ "rstrip": false,
567
+ "normalized": false,
568
+ "special": true
569
+ },
570
+ "50099": {
571
+ "content": "<|pad_token[51]|>",
572
+ "single_word": false,
573
+ "lstrip": false,
574
+ "rstrip": false,
575
+ "normalized": false,
576
+ "special": true
577
+ },
578
+ "50100": {
579
+ "content": "<|pad_token[52]|>",
580
+ "single_word": false,
581
+ "lstrip": false,
582
+ "rstrip": false,
583
+ "normalized": false,
584
+ "special": true
585
+ },
586
+ "50101": {
587
+ "content": "<|pad_token[53]|>",
588
+ "single_word": false,
589
+ "lstrip": false,
590
+ "rstrip": false,
591
+ "normalized": false,
592
+ "special": true
593
+ },
594
+ "50102": {
595
+ "content": "<|pad_token[54]|>",
596
+ "single_word": false,
597
+ "lstrip": false,
598
+ "rstrip": false,
599
+ "normalized": false,
600
+ "special": true
601
+ },
602
+ "50103": {
603
+ "content": "<|pad_token[55]|>",
604
+ "single_word": false,
605
+ "lstrip": false,
606
+ "rstrip": false,
607
+ "normalized": false,
608
+ "special": true
609
+ },
610
+ "50104": {
611
+ "content": "<|pad_token[56]|>",
612
+ "single_word": false,
613
+ "lstrip": false,
614
+ "rstrip": false,
615
+ "normalized": false,
616
+ "special": true
617
+ },
618
+ "50105": {
619
+ "content": "<|pad_token[57]|>",
620
+ "single_word": false,
621
+ "lstrip": false,
622
+ "rstrip": false,
623
+ "normalized": false,
624
+ "special": true
625
+ },
626
+ "50106": {
627
+ "content": "<|pad_token[58]|>",
628
+ "single_word": false,
629
+ "lstrip": false,
630
+ "rstrip": false,
631
+ "normalized": false,
632
+ "special": true
633
+ },
634
+ "50107": {
635
+ "content": "<|pad_token[59]|>",
636
+ "single_word": false,
637
+ "lstrip": false,
638
+ "rstrip": false,
639
+ "normalized": false,
640
+ "special": true
641
+ },
642
+ "50108": {
643
+ "content": "<|pad_token[60]|>",
644
+ "single_word": false,
645
+ "lstrip": false,
646
+ "rstrip": false,
647
+ "normalized": false,
648
+ "special": true
649
+ },
650
+ "50109": {
651
+ "content": "<|pad_token[61]|>",
652
+ "single_word": false,
653
+ "lstrip": false,
654
+ "rstrip": false,
655
+ "normalized": false,
656
+ "special": true
657
+ },
658
+ "50110": {
659
+ "content": "<|pad_token[62]|>",
660
+ "single_word": false,
661
+ "lstrip": false,
662
+ "rstrip": false,
663
+ "normalized": false,
664
+ "special": true
665
+ },
666
+ "50111": {
667
+ "content": "<|pad_token[63]|>",
668
+ "single_word": false,
669
+ "lstrip": false,
670
+ "rstrip": false,
671
+ "normalized": false,
672
+ "special": true
673
+ },
674
+ "50112": {
675
+ "content": "<|pad_token[64]|>",
676
+ "single_word": false,
677
+ "lstrip": false,
678
+ "rstrip": false,
679
+ "normalized": false,
680
+ "special": true
681
+ },
682
+ "50113": {
683
+ "content": "<|pad_token[65]|>",
684
+ "single_word": false,
685
+ "lstrip": false,
686
+ "rstrip": false,
687
+ "normalized": false,
688
+ "special": true
689
+ },
690
+ "50114": {
691
+ "content": "<|pad_token[66]|>",
692
+ "single_word": false,
693
+ "lstrip": false,
694
+ "rstrip": false,
695
+ "normalized": false,
696
+ "special": true
697
+ },
698
+ "50115": {
699
+ "content": "<|pad_token[67]|>",
700
+ "single_word": false,
701
+ "lstrip": false,
702
+ "rstrip": false,
703
+ "normalized": false,
704
+ "special": true
705
+ },
706
+ "50116": {
707
+ "content": "<|pad_token[68]|>",
708
+ "single_word": false,
709
+ "lstrip": false,
710
+ "rstrip": false,
711
+ "normalized": false,
712
+ "special": true
713
+ },
714
+ "50117": {
715
+ "content": "<|pad_token[69]|>",
716
+ "single_word": false,
717
+ "lstrip": false,
718
+ "rstrip": false,
719
+ "normalized": false,
720
+ "special": true
721
+ },
722
+ "50118": {
723
+ "content": "<|pad_token[70]|>",
724
+ "single_word": false,
725
+ "lstrip": false,
726
+ "rstrip": false,
727
+ "normalized": false,
728
+ "special": true
729
+ },
730
+ "50119": {
731
+ "content": "<|pad_token[71]|>",
732
+ "single_word": false,
733
+ "lstrip": false,
734
+ "rstrip": false,
735
+ "normalized": false,
736
+ "special": true
737
+ },
738
+ "50120": {
739
+ "content": "<|pad_token[72]|>",
740
+ "single_word": false,
741
+ "lstrip": false,
742
+ "rstrip": false,
743
+ "normalized": false,
744
+ "special": true
745
+ },
746
+ "50121": {
747
+ "content": "<|pad_token[73]|>",
748
+ "single_word": false,
749
+ "lstrip": false,
750
+ "rstrip": false,
751
+ "normalized": false,
752
+ "special": true
753
+ },
754
+ "50122": {
755
+ "content": "<|pad_token[74]|>",
756
+ "single_word": false,
757
+ "lstrip": false,
758
+ "rstrip": false,
759
+ "normalized": false,
760
+ "special": true
761
+ },
762
+ "50123": {
763
+ "content": "<|pad_token[75]|>",
764
+ "single_word": false,
765
+ "lstrip": false,
766
+ "rstrip": false,
767
+ "normalized": false,
768
+ "special": true
769
+ },
770
+ "50124": {
771
+ "content": "<|pad_token[76]|>",
772
+ "single_word": false,
773
+ "lstrip": false,
774
+ "rstrip": false,
775
+ "normalized": false,
776
+ "special": true
777
+ },
778
+ "50125": {
779
+ "content": "<|pad_token[77]|>",
780
+ "single_word": false,
781
+ "lstrip": false,
782
+ "rstrip": false,
783
+ "normalized": false,
784
+ "special": true
785
+ },
786
+ "50126": {
787
+ "content": "<|pad_token[78]|>",
788
+ "single_word": false,
789
+ "lstrip": false,
790
+ "rstrip": false,
791
+ "normalized": false,
792
+ "special": true
793
+ },
794
+ "50127": {
795
+ "content": "<|pad_token[79]|>",
796
+ "single_word": false,
797
+ "lstrip": false,
798
+ "rstrip": false,
799
+ "normalized": false,
800
+ "special": true
801
+ },
802
+ "50128": {
803
+ "content": "<|pad_token[80]|>",
804
+ "single_word": false,
805
+ "lstrip": false,
806
+ "rstrip": false,
807
+ "normalized": false,
808
+ "special": true
809
+ },
810
+ "50129": {
811
+ "content": "<|pad_token[81]|>",
812
+ "single_word": false,
813
+ "lstrip": false,
814
+ "rstrip": false,
815
+ "normalized": false,
816
+ "special": true
817
+ },
818
+ "50130": {
819
+ "content": "<|pad_token[82]|>",
820
+ "single_word": false,
821
+ "lstrip": false,
822
+ "rstrip": false,
823
+ "normalized": false,
824
+ "special": true
825
+ },
826
+ "50131": {
827
+ "content": "<|pad_token[83]|>",
828
+ "single_word": false,
829
+ "lstrip": false,
830
+ "rstrip": false,
831
+ "normalized": false,
832
+ "special": true
833
+ },
834
+ "50132": {
835
+ "content": "<|pad_token[84]|>",
836
+ "single_word": false,
837
+ "lstrip": false,
838
+ "rstrip": false,
839
+ "normalized": false,
840
+ "special": true
841
+ },
842
+ "50133": {
843
+ "content": "<|pad_token[85]|>",
844
+ "single_word": false,
845
+ "lstrip": false,
846
+ "rstrip": false,
847
+ "normalized": false,
848
+ "special": true
849
+ },
850
+ "50134": {
851
+ "content": "<|pad_token[86]|>",
852
+ "single_word": false,
853
+ "lstrip": false,
854
+ "rstrip": false,
855
+ "normalized": false,
856
+ "special": true
857
+ },
858
+ "50135": {
859
+ "content": "<|pad_token[87]|>",
860
+ "single_word": false,
861
+ "lstrip": false,
862
+ "rstrip": false,
863
+ "normalized": false,
864
+ "special": true
865
+ },
866
+ "50136": {
867
+ "content": "<|pad_token[88]|>",
868
+ "single_word": false,
869
+ "lstrip": false,
870
+ "rstrip": false,
871
+ "normalized": false,
872
+ "special": true
873
+ },
874
+ "50137": {
875
+ "content": "<|pad_token[89]|>",
876
+ "single_word": false,
877
+ "lstrip": false,
878
+ "rstrip": false,
879
+ "normalized": false,
880
+ "special": true
881
+ },
882
+ "50138": {
883
+ "content": "<|pad_token[90]|>",
884
+ "single_word": false,
885
+ "lstrip": false,
886
+ "rstrip": false,
887
+ "normalized": false,
888
+ "special": true
889
+ },
890
+ "50139": {
891
+ "content": "<|pad_token[91]|>",
892
+ "single_word": false,
893
+ "lstrip": false,
894
+ "rstrip": false,
895
+ "normalized": false,
896
+ "special": true
897
+ },
898
+ "50140": {
899
+ "content": "<|pad_token[92]|>",
900
+ "single_word": false,
901
+ "lstrip": false,
902
+ "rstrip": false,
903
+ "normalized": false,
904
+ "special": true
905
+ },
906
+ "50141": {
907
+ "content": "<|pad_token[93]|>",
908
+ "single_word": false,
909
+ "lstrip": false,
910
+ "rstrip": false,
911
+ "normalized": false,
912
+ "special": true
913
+ },
914
+ "50142": {
915
+ "content": "<|pad_token[94]|>",
916
+ "single_word": false,
917
+ "lstrip": false,
918
+ "rstrip": false,
919
+ "normalized": false,
920
+ "special": true
921
+ },
922
+ "50143": {
923
+ "content": "<|pad_token[95]|>",
924
+ "single_word": false,
925
+ "lstrip": false,
926
+ "rstrip": false,
927
+ "normalized": false,
928
+ "special": true
929
+ },
930
+ "50144": {
931
+ "content": "<|pad_token[96]|>",
932
+ "single_word": false,
933
+ "lstrip": false,
934
+ "rstrip": false,
935
+ "normalized": false,
936
+ "special": true
937
+ },
938
+ "50145": {
939
+ "content": "<|pad_token[97]|>",
940
+ "single_word": false,
941
+ "lstrip": false,
942
+ "rstrip": false,
943
+ "normalized": false,
944
+ "special": true
945
+ },
946
+ "50146": {
947
+ "content": "<|pad_token[98]|>",
948
+ "single_word": false,
949
+ "lstrip": false,
950
+ "rstrip": false,
951
+ "normalized": false,
952
+ "special": true
953
+ },
954
+ "50147": {
955
+ "content": "<|pad_token[99]|>",
956
+ "single_word": false,
957
+ "lstrip": false,
958
+ "rstrip": false,
959
+ "normalized": false,
960
+ "special": true
961
+ },
962
+ "50148": {
963
+ "content": "<|pad_token[100]|>",
964
+ "single_word": false,
965
+ "lstrip": false,
966
+ "rstrip": false,
967
+ "normalized": false,
968
+ "special": true
969
+ },
970
+ "50149": {
971
+ "content": "<|pad_token[101]|>",
972
+ "single_word": false,
973
+ "lstrip": false,
974
+ "rstrip": false,
975
+ "normalized": false,
976
+ "special": true
977
+ },
978
+ "50150": {
979
+ "content": "<|pad_token[102]|>",
980
+ "single_word": false,
981
+ "lstrip": false,
982
+ "rstrip": false,
983
+ "normalized": false,
984
+ "special": true
985
+ },
986
+ "50151": {
987
+ "content": "<|pad_token[103]|>",
988
+ "single_word": false,
989
+ "lstrip": false,
990
+ "rstrip": false,
991
+ "normalized": false,
992
+ "special": true
993
+ },
994
+ "50152": {
995
+ "content": "<|pad_token[104]|>",
996
+ "single_word": false,
997
+ "lstrip": false,
998
+ "rstrip": false,
999
+ "normalized": false,
1000
+ "special": true
1001
+ },
1002
+ "50153": {
1003
+ "content": "<|pad_token[105]|>",
1004
+ "single_word": false,
1005
+ "lstrip": false,
1006
+ "rstrip": false,
1007
+ "normalized": false,
1008
+ "special": true
1009
+ },
1010
+ "50154": {
1011
+ "content": "<|pad_token[106]|>",
1012
+ "single_word": false,
1013
+ "lstrip": false,
1014
+ "rstrip": false,
1015
+ "normalized": false,
1016
+ "special": true
1017
+ },
1018
+ "50155": {
1019
+ "content": "<|pad_token[107]|>",
1020
+ "single_word": false,
1021
+ "lstrip": false,
1022
+ "rstrip": false,
1023
+ "normalized": false,
1024
+ "special": true
1025
+ },
1026
+ "50156": {
1027
+ "content": "<|pad_token[108]|>",
1028
+ "single_word": false,
1029
+ "lstrip": false,
1030
+ "rstrip": false,
1031
+ "normalized": false,
1032
+ "special": true
1033
+ },
1034
+ "50157": {
1035
+ "content": "<|pad_token[109]|>",
1036
+ "single_word": false,
1037
+ "lstrip": false,
1038
+ "rstrip": false,
1039
+ "normalized": false,
1040
+ "special": true
1041
+ },
1042
+ "50158": {
1043
+ "content": "<|pad_token[110]|>",
1044
+ "single_word": false,
1045
+ "lstrip": false,
1046
+ "rstrip": false,
1047
+ "normalized": false,
1048
+ "special": true
1049
+ },
1050
+ "50159": {
1051
+ "content": "<|pad_token[111]|>",
1052
+ "single_word": false,
1053
+ "lstrip": false,
1054
+ "rstrip": false,
1055
+ "normalized": false,
1056
+ "special": true
1057
+ },
1058
+ "50160": {
1059
+ "content": "<|pad_token[112]|>",
1060
+ "single_word": false,
1061
+ "lstrip": false,
1062
+ "rstrip": false,
1063
+ "normalized": false,
1064
+ "special": true
1065
+ },
1066
+ "50161": {
1067
+ "content": "<|pad_token[113]|>",
1068
+ "single_word": false,
1069
+ "lstrip": false,
1070
+ "rstrip": false,
1071
+ "normalized": false,
1072
+ "special": true
1073
+ },
1074
+ "50162": {
1075
+ "content": "<|pad_token[114]|>",
1076
+ "single_word": false,
1077
+ "lstrip": false,
1078
+ "rstrip": false,
1079
+ "normalized": false,
1080
+ "special": true
1081
+ },
1082
+ "50163": {
1083
+ "content": "<|pad_token[115]|>",
1084
+ "single_word": false,
1085
+ "lstrip": false,
1086
+ "rstrip": false,
1087
+ "normalized": false,
1088
+ "special": true
1089
+ },
1090
+ "50164": {
1091
+ "content": "<|pad_token[116]|>",
1092
+ "single_word": false,
1093
+ "lstrip": false,
1094
+ "rstrip": false,
1095
+ "normalized": false,
1096
+ "special": true
1097
+ },
1098
+ "50165": {
1099
+ "content": "<|pad_token[117]|>",
1100
+ "single_word": false,
1101
+ "lstrip": false,
1102
+ "rstrip": false,
1103
+ "normalized": false,
1104
+ "special": true
1105
+ },
1106
+ "50166": {
1107
+ "content": "<|pad_token[118]|>",
1108
+ "single_word": false,
1109
+ "lstrip": false,
1110
+ "rstrip": false,
1111
+ "normalized": false,
1112
+ "special": true
1113
+ },
1114
+ "50167": {
1115
+ "content": "<|pad_token[119]|>",
1116
+ "single_word": false,
1117
+ "lstrip": false,
1118
+ "rstrip": false,
1119
+ "normalized": false,
1120
+ "special": true
1121
+ },
1122
+ "50168": {
1123
+ "content": "<|pad_token[120]|>",
1124
+ "single_word": false,
1125
+ "lstrip": false,
1126
+ "rstrip": false,
1127
+ "normalized": false,
1128
+ "special": true
1129
+ },
1130
+ "50169": {
1131
+ "content": "<|pad_token[121]|>",
1132
+ "single_word": false,
1133
+ "lstrip": false,
1134
+ "rstrip": false,
1135
+ "normalized": false,
1136
+ "special": true
1137
+ },
1138
+ "50170": {
1139
+ "content": "<|pad_token[122]|>",
1140
+ "single_word": false,
1141
+ "lstrip": false,
1142
+ "rstrip": false,
1143
+ "normalized": false,
1144
+ "special": true
1145
+ },
1146
+ "50171": {
1147
+ "content": "<|pad_token[123]|>",
1148
+ "single_word": false,
1149
+ "lstrip": false,
1150
+ "rstrip": false,
1151
+ "normalized": false,
1152
+ "special": true
1153
+ },
1154
+ "50172": {
1155
+ "content": "<|pad_token[124]|>",
1156
+ "single_word": false,
1157
+ "lstrip": false,
1158
+ "rstrip": false,
1159
+ "normalized": false,
1160
+ "special": true
1161
+ },
1162
+ "50173": {
1163
+ "content": "<|pad_token[125]|>",
1164
+ "single_word": false,
1165
+ "lstrip": false,
1166
+ "rstrip": false,
1167
+ "normalized": false,
1168
+ "special": true
1169
+ },
1170
+ "50174": {
1171
+ "content": "<|pad_token[126]|>",
1172
+ "single_word": false,
1173
+ "lstrip": false,
1174
+ "rstrip": false,
1175
+ "normalized": false,
1176
+ "special": true
1177
+ },
1178
+ "50175": {
1179
+ "content": "<|pad_token[127]|>",
1180
+ "single_word": false,
1181
+ "lstrip": false,
1182
+ "rstrip": false,
1183
+ "normalized": false,
1184
+ "special": true
1185
+ },
1186
+ "50176": {
1187
+ "content": "<|pad_token[128]|>",
1188
+ "single_word": false,
1189
+ "lstrip": false,
1190
+ "rstrip": false,
1191
+ "normalized": false,
1192
+ "special": true
1193
+ },
1194
+ "50177": {
1195
+ "content": "<|pad_token[129]|>",
1196
+ "single_word": false,
1197
+ "lstrip": false,
1198
+ "rstrip": false,
1199
+ "normalized": false,
1200
+ "special": true
1201
+ },
1202
+ "50178": {
1203
+ "content": "<|pad_token[130]|>",
1204
+ "single_word": false,
1205
+ "lstrip": false,
1206
+ "rstrip": false,
1207
+ "normalized": false,
1208
+ "special": true
1209
+ },
1210
+ "50179": {
1211
+ "content": "<|pad_token[131]|>",
1212
+ "single_word": false,
1213
+ "lstrip": false,
1214
+ "rstrip": false,
1215
+ "normalized": false,
1216
+ "special": true
1217
+ },
1218
+ "50180": {
1219
+ "content": "<|pad_token[132]|>",
1220
+ "single_word": false,
1221
+ "lstrip": false,
1222
+ "rstrip": false,
1223
+ "normalized": false,
1224
+ "special": true
1225
+ },
1226
+ "50181": {
1227
+ "content": "<|pad_token[133]|>",
1228
+ "single_word": false,
1229
+ "lstrip": false,
1230
+ "rstrip": false,
1231
+ "normalized": false,
1232
+ "special": true
1233
+ },
1234
+ "50182": {
1235
+ "content": "<|pad_token[134]|>",
1236
+ "single_word": false,
1237
+ "lstrip": false,
1238
+ "rstrip": false,
1239
+ "normalized": false,
1240
+ "special": true
1241
+ },
1242
+ "50183": {
1243
+ "content": "<|pad_token[135]|>",
1244
+ "single_word": false,
1245
+ "lstrip": false,
1246
+ "rstrip": false,
1247
+ "normalized": false,
1248
+ "special": true
1249
+ },
1250
+ "50184": {
1251
+ "content": "<|pad_token[136]|>",
1252
+ "single_word": false,
1253
+ "lstrip": false,
1254
+ "rstrip": false,
1255
+ "normalized": false,
1256
+ "special": true
1257
+ },
1258
+ "50185": {
1259
+ "content": "<|pad_token[137]|>",
1260
+ "single_word": false,
1261
+ "lstrip": false,
1262
+ "rstrip": false,
1263
+ "normalized": false,
1264
+ "special": true
1265
+ },
1266
+ "50186": {
1267
+ "content": "<|pad_token[138]|>",
1268
+ "single_word": false,
1269
+ "lstrip": false,
1270
+ "rstrip": false,
1271
+ "normalized": false,
1272
+ "special": true
1273
+ },
1274
+ "50187": {
1275
+ "content": "<|pad_token[139]|>",
1276
+ "single_word": false,
1277
+ "lstrip": false,
1278
+ "rstrip": false,
1279
+ "normalized": false,
1280
+ "special": true
1281
+ },
1282
+ "50188": {
1283
+ "content": "<|pad_token[140]|>",
1284
+ "single_word": false,
1285
+ "lstrip": false,
1286
+ "rstrip": false,
1287
+ "normalized": false,
1288
+ "special": true
1289
+ },
1290
+ "50189": {
1291
+ "content": "<|pad_token[141]|>",
1292
+ "single_word": false,
1293
+ "lstrip": false,
1294
+ "rstrip": false,
1295
+ "normalized": false,
1296
+ "special": true
1297
+ },
1298
+ "50190": {
1299
+ "content": "<|pad_token[142]|>",
1300
+ "single_word": false,
1301
+ "lstrip": false,
1302
+ "rstrip": false,
1303
+ "normalized": false,
1304
+ "special": true
1305
+ },
1306
+ "50191": {
1307
+ "content": "<|pad_token[143]|>",
1308
+ "single_word": false,
1309
+ "lstrip": false,
1310
+ "rstrip": false,
1311
+ "normalized": false,
1312
+ "special": true
1313
+ },
1314
+ "50192": {
1315
+ "content": "<|pad_token[144]|>",
1316
+ "single_word": false,
1317
+ "lstrip": false,
1318
+ "rstrip": false,
1319
+ "normalized": false,
1320
+ "special": true
1321
+ },
1322
+ "50193": {
1323
+ "content": "<|pad_token[145]|>",
1324
+ "single_word": false,
1325
+ "lstrip": false,
1326
+ "rstrip": false,
1327
+ "normalized": false,
1328
+ "special": true
1329
+ },
1330
+ "50194": {
1331
+ "content": "<|pad_token[146]|>",
1332
+ "single_word": false,
1333
+ "lstrip": false,
1334
+ "rstrip": false,
1335
+ "normalized": false,
1336
+ "special": true
1337
+ },
1338
+ "50195": {
1339
+ "content": "<|pad_token[147]|>",
1340
+ "single_word": false,
1341
+ "lstrip": false,
1342
+ "rstrip": false,
1343
+ "normalized": false,
1344
+ "special": true
1345
+ },
1346
+ "50196": {
1347
+ "content": "<|pad_token[148]|>",
1348
+ "single_word": false,
1349
+ "lstrip": false,
1350
+ "rstrip": false,
1351
+ "normalized": false,
1352
+ "special": true
1353
+ },
1354
+ "50197": {
1355
+ "content": "<|pad_token[149]|>",
1356
+ "single_word": false,
1357
+ "lstrip": false,
1358
+ "rstrip": false,
1359
+ "normalized": false,
1360
+ "special": true
1361
+ },
1362
+ "50198": {
1363
+ "content": "<|pad_token[150]|>",
1364
+ "single_word": false,
1365
+ "lstrip": false,
1366
+ "rstrip": false,
1367
+ "normalized": false,
1368
+ "special": true
1369
+ },
1370
+ "50199": {
1371
+ "content": "<|pad_token[151]|>",
1372
+ "single_word": false,
1373
+ "lstrip": false,
1374
+ "rstrip": false,
1375
+ "normalized": false,
1376
+ "special": true
1377
+ },
1378
+ "50200": {
1379
+ "content": "<|pad_token[152]|>",
1380
+ "single_word": false,
1381
+ "lstrip": false,
1382
+ "rstrip": false,
1383
+ "normalized": false,
1384
+ "special": true
1385
+ },
1386
+ "50201": {
1387
+ "content": "<|pad_token[153]|>",
1388
+ "single_word": false,
1389
+ "lstrip": false,
1390
+ "rstrip": false,
1391
+ "normalized": false,
1392
+ "special": true
1393
+ },
1394
+ "50202": {
1395
+ "content": "<|pad_token[154]|>",
1396
+ "single_word": false,
1397
+ "lstrip": false,
1398
+ "rstrip": false,
1399
+ "normalized": false,
1400
+ "special": true
1401
+ },
1402
+ "50203": {
1403
+ "content": "<|pad_token[155]|>",
1404
+ "single_word": false,
1405
+ "lstrip": false,
1406
+ "rstrip": false,
1407
+ "normalized": false,
1408
+ "special": true
1409
+ },
1410
+ "50204": {
1411
+ "content": "<|pad_token[156]|>",
1412
+ "single_word": false,
1413
+ "lstrip": false,
1414
+ "rstrip": false,
1415
+ "normalized": false,
1416
+ "special": true
1417
+ },
1418
+ "50205": {
1419
+ "content": "<|pad_token[157]|>",
1420
+ "single_word": false,
1421
+ "lstrip": false,
1422
+ "rstrip": false,
1423
+ "normalized": false,
1424
+ "special": true
1425
+ },
1426
+ "50206": {
1427
+ "content": "<|pad_token[158]|>",
1428
+ "single_word": false,
1429
+ "lstrip": false,
1430
+ "rstrip": false,
1431
+ "normalized": false,
1432
+ "special": true
1433
+ },
1434
+ "50207": {
1435
+ "content": "<|pad_token[159]|>",
1436
+ "single_word": false,
1437
+ "lstrip": false,
1438
+ "rstrip": false,
1439
+ "normalized": false,
1440
+ "special": true
1441
+ },
1442
+ "50208": {
1443
+ "content": "<|pad_token[160]|>",
1444
+ "single_word": false,
1445
+ "lstrip": false,
1446
+ "rstrip": false,
1447
+ "normalized": false,
1448
+ "special": true
1449
+ },
1450
+ "50209": {
1451
+ "content": "<|pad_token[161]|>",
1452
+ "single_word": false,
1453
+ "lstrip": false,
1454
+ "rstrip": false,
1455
+ "normalized": false,
1456
+ "special": true
1457
+ },
1458
+ "50210": {
1459
+ "content": "<|pad_token[162]|>",
1460
+ "single_word": false,
1461
+ "lstrip": false,
1462
+ "rstrip": false,
1463
+ "normalized": false,
1464
+ "special": true
1465
+ },
1466
+ "50211": {
1467
+ "content": "<|pad_token[163]|>",
1468
+ "single_word": false,
1469
+ "lstrip": false,
1470
+ "rstrip": false,
1471
+ "normalized": false,
1472
+ "special": true
1473
+ },
1474
+ "50212": {
1475
+ "content": "<|pad_token[164]|>",
1476
+ "single_word": false,
1477
+ "lstrip": false,
1478
+ "rstrip": false,
1479
+ "normalized": false,
1480
+ "special": true
1481
+ },
1482
+ "50213": {
1483
+ "content": "<|pad_token[165]|>",
1484
+ "single_word": false,
1485
+ "lstrip": false,
1486
+ "rstrip": false,
1487
+ "normalized": false,
1488
+ "special": true
1489
+ },
1490
+ "50214": {
1491
+ "content": "<|pad_token[166]|>",
1492
+ "single_word": false,
1493
+ "lstrip": false,
1494
+ "rstrip": false,
1495
+ "normalized": false,
1496
+ "special": true
1497
+ },
1498
+ "50215": {
1499
+ "content": "<|pad_token[167]|>",
1500
+ "single_word": false,
1501
+ "lstrip": false,
1502
+ "rstrip": false,
1503
+ "normalized": false,
1504
+ "special": true
1505
+ },
1506
+ "50216": {
1507
+ "content": "<|pad_token[168]|>",
1508
+ "single_word": false,
1509
+ "lstrip": false,
1510
+ "rstrip": false,
1511
+ "normalized": false,
1512
+ "special": true
1513
+ },
1514
+ "50217": {
1515
+ "content": "<|pad_token[169]|>",
1516
+ "single_word": false,
1517
+ "lstrip": false,
1518
+ "rstrip": false,
1519
+ "normalized": false,
1520
+ "special": true
1521
+ },
1522
+ "50218": {
1523
+ "content": "<|pad_token[170]|>",
1524
+ "single_word": false,
1525
+ "lstrip": false,
1526
+ "rstrip": false,
1527
+ "normalized": false,
1528
+ "special": true
1529
+ },
1530
+ "50219": {
1531
+ "content": "<|pad_token[171]|>",
1532
+ "single_word": false,
1533
+ "lstrip": false,
1534
+ "rstrip": false,
1535
+ "normalized": false,
1536
+ "special": true
1537
+ },
1538
+ "50220": {
1539
+ "content": "<|pad_token[172]|>",
1540
+ "single_word": false,
1541
+ "lstrip": false,
1542
+ "rstrip": false,
1543
+ "normalized": false,
1544
+ "special": true
1545
+ },
1546
+ "50221": {
1547
+ "content": "<|pad_token[173]|>",
1548
+ "single_word": false,
1549
+ "lstrip": false,
1550
+ "rstrip": false,
1551
+ "normalized": false,
1552
+ "special": true
1553
+ },
1554
+ "50222": {
1555
+ "content": "<|pad_token[174]|>",
1556
+ "single_word": false,
1557
+ "lstrip": false,
1558
+ "rstrip": false,
1559
+ "normalized": false,
1560
+ "special": true
1561
+ },
1562
+ "50223": {
1563
+ "content": "<|pad_token[175]|>",
1564
+ "single_word": false,
1565
+ "lstrip": false,
1566
+ "rstrip": false,
1567
+ "normalized": false,
1568
+ "special": true
1569
+ },
1570
+ "50224": {
1571
+ "content": "<|pad_token[176]|>",
1572
+ "single_word": false,
1573
+ "lstrip": false,
1574
+ "rstrip": false,
1575
+ "normalized": false,
1576
+ "special": true
1577
+ },
1578
+ "50225": {
1579
+ "content": "<|pad_token[177]|>",
1580
+ "single_word": false,
1581
+ "lstrip": false,
1582
+ "rstrip": false,
1583
+ "normalized": false,
1584
+ "special": true
1585
+ },
1586
+ "50226": {
1587
+ "content": "<|pad_token[178]|>",
1588
+ "single_word": false,
1589
+ "lstrip": false,
1590
+ "rstrip": false,
1591
+ "normalized": false,
1592
+ "special": true
1593
+ },
1594
+ "50227": {
1595
+ "content": "<|pad_token[179]|>",
1596
+ "single_word": false,
1597
+ "lstrip": false,
1598
+ "rstrip": false,
1599
+ "normalized": false,
1600
+ "special": true
1601
+ },
1602
+ "50228": {
1603
+ "content": "<|pad_token[180]|>",
1604
+ "single_word": false,
1605
+ "lstrip": false,
1606
+ "rstrip": false,
1607
+ "normalized": false,
1608
+ "special": true
1609
+ },
1610
+ "50229": {
1611
+ "content": "<|pad_token[181]|>",
1612
+ "single_word": false,
1613
+ "lstrip": false,
1614
+ "rstrip": false,
1615
+ "normalized": false,
1616
+ "special": true
1617
+ },
1618
+ "50230": {
1619
+ "content": "<|pad_token[182]|>",
1620
+ "single_word": false,
1621
+ "lstrip": false,
1622
+ "rstrip": false,
1623
+ "normalized": false,
1624
+ "special": true
1625
+ },
1626
+ "50231": {
1627
+ "content": "<|pad_token[183]|>",
1628
+ "single_word": false,
1629
+ "lstrip": false,
1630
+ "rstrip": false,
1631
+ "normalized": false,
1632
+ "special": true
1633
+ },
1634
+ "50232": {
1635
+ "content": "<|pad_token[184]|>",
1636
+ "single_word": false,
1637
+ "lstrip": false,
1638
+ "rstrip": false,
1639
+ "normalized": false,
1640
+ "special": true
1641
+ },
1642
+ "50233": {
1643
+ "content": "<|pad_token[185]|>",
1644
+ "single_word": false,
1645
+ "lstrip": false,
1646
+ "rstrip": false,
1647
+ "normalized": false,
1648
+ "special": true
1649
+ },
1650
+ "50234": {
1651
+ "content": "<|pad_token[186]|>",
1652
+ "single_word": false,
1653
+ "lstrip": false,
1654
+ "rstrip": false,
1655
+ "normalized": false,
1656
+ "special": true
1657
+ },
1658
+ "50235": {
1659
+ "content": "<|pad_token[187]|>",
1660
+ "single_word": false,
1661
+ "lstrip": false,
1662
+ "rstrip": false,
1663
+ "normalized": false,
1664
+ "special": true
1665
+ },
1666
+ "50236": {
1667
+ "content": "<|pad_token[188]|>",
1668
+ "single_word": false,
1669
+ "lstrip": false,
1670
+ "rstrip": false,
1671
+ "normalized": false,
1672
+ "special": true
1673
+ },
1674
+ "50237": {
1675
+ "content": "<|pad_token[189]|>",
1676
+ "single_word": false,
1677
+ "lstrip": false,
1678
+ "rstrip": false,
1679
+ "normalized": false,
1680
+ "special": true
1681
+ },
1682
+ "50238": {
1683
+ "content": "<|pad_token[190]|>",
1684
+ "single_word": false,
1685
+ "lstrip": false,
1686
+ "rstrip": false,
1687
+ "normalized": false,
1688
+ "special": true
1689
+ },
1690
+ "50239": {
1691
+ "content": "<|pad_token[191]|>",
1692
+ "single_word": false,
1693
+ "lstrip": false,
1694
+ "rstrip": false,
1695
+ "normalized": false,
1696
+ "special": true
1697
+ },
1698
+ "50240": {
1699
+ "content": "<|pad_token[192]|>",
1700
+ "single_word": false,
1701
+ "lstrip": false,
1702
+ "rstrip": false,
1703
+ "normalized": false,
1704
+ "special": true
1705
+ },
1706
+ "50241": {
1707
+ "content": "<|pad_token[193]|>",
1708
+ "single_word": false,
1709
+ "lstrip": false,
1710
+ "rstrip": false,
1711
+ "normalized": false,
1712
+ "special": true
1713
+ },
1714
+ "50242": {
1715
+ "content": "<|pad_token[194]|>",
1716
+ "single_word": false,
1717
+ "lstrip": false,
1718
+ "rstrip": false,
1719
+ "normalized": false,
1720
+ "special": true
1721
+ },
1722
+ "50243": {
1723
+ "content": "<|pad_token[195]|>",
1724
+ "single_word": false,
1725
+ "lstrip": false,
1726
+ "rstrip": false,
1727
+ "normalized": false,
1728
+ "special": true
1729
+ },
1730
+ "50244": {
1731
+ "content": "<|pad_token[196]|>",
1732
+ "single_word": false,
1733
+ "lstrip": false,
1734
+ "rstrip": false,
1735
+ "normalized": false,
1736
+ "special": true
1737
+ },
1738
+ "50245": {
1739
+ "content": "<|pad_token[197]|>",
1740
+ "single_word": false,
1741
+ "lstrip": false,
1742
+ "rstrip": false,
1743
+ "normalized": false,
1744
+ "special": true
1745
+ },
1746
+ "50246": {
1747
+ "content": "<|pad_token[198]|>",
1748
+ "single_word": false,
1749
+ "lstrip": false,
1750
+ "rstrip": false,
1751
+ "normalized": false,
1752
+ "special": true
1753
+ },
1754
+ "50247": {
1755
+ "content": "<|pad_token[199]|>",
1756
+ "single_word": false,
1757
+ "lstrip": false,
1758
+ "rstrip": false,
1759
+ "normalized": false,
1760
+ "special": true
1761
+ },
1762
+ "50248": {
1763
+ "content": "<|pad_token[200]|>",
1764
+ "single_word": false,
1765
+ "lstrip": false,
1766
+ "rstrip": false,
1767
+ "normalized": false,
1768
+ "special": true
1769
+ },
1770
+ "50249": {
1771
+ "content": "<|pad_token[201]|>",
1772
+ "single_word": false,
1773
+ "lstrip": false,
1774
+ "rstrip": false,
1775
+ "normalized": false,
1776
+ "special": true
1777
+ },
1778
+ "50250": {
1779
+ "content": "<|pad_token[202]|>",
1780
+ "single_word": false,
1781
+ "lstrip": false,
1782
+ "rstrip": false,
1783
+ "normalized": false,
1784
+ "special": true
1785
+ },
1786
+ "50251": {
1787
+ "content": "<|pad_token[203]|>",
1788
+ "single_word": false,
1789
+ "lstrip": false,
1790
+ "rstrip": false,
1791
+ "normalized": false,
1792
+ "special": true
1793
+ },
1794
+ "50252": {
1795
+ "content": "<|pad_token[204]|>",
1796
+ "single_word": false,
1797
+ "lstrip": false,
1798
+ "rstrip": false,
1799
+ "normalized": false,
1800
+ "special": true
1801
+ },
1802
+ "50253": {
1803
+ "content": "<|pad_token[205]|>",
1804
+ "single_word": false,
1805
+ "lstrip": false,
1806
+ "rstrip": false,
1807
+ "normalized": false,
1808
+ "special": true
1809
+ },
1810
+ "50254": {
1811
+ "content": "<|pad_token[206]|>",
1812
+ "single_word": false,
1813
+ "lstrip": false,
1814
+ "rstrip": false,
1815
+ "normalized": false,
1816
+ "special": true
1817
+ },
1818
+ "50255": {
1819
+ "content": "<|pad_token[207]|>",
1820
+ "single_word": false,
1821
+ "lstrip": false,
1822
+ "rstrip": false,
1823
+ "normalized": false,
1824
+ "special": true
1825
+ },
1826
+ "50256": {
1827
+ "content": "<|pad_token[208]|>",
1828
+ "single_word": false,
1829
+ "lstrip": false,
1830
+ "rstrip": false,
1831
+ "normalized": false,
1832
+ "special": true
1833
+ },
1834
+ "50257": {
1835
+ "content": "<|pad_token[209]|>",
1836
+ "single_word": false,
1837
+ "lstrip": false,
1838
+ "rstrip": false,
1839
+ "normalized": false,
1840
+ "special": true
1841
+ },
1842
+ "50258": {
1843
+ "content": "<|pad_token[210]|>",
1844
+ "single_word": false,
1845
+ "lstrip": false,
1846
+ "rstrip": false,
1847
+ "normalized": false,
1848
+ "special": true
1849
+ },
1850
+ "50259": {
1851
+ "content": "<|pad_token[211]|>",
1852
+ "single_word": false,
1853
+ "lstrip": false,
1854
+ "rstrip": false,
1855
+ "normalized": false,
1856
+ "special": true
1857
+ },
1858
+ "50260": {
1859
+ "content": "<|pad_token[212]|>",
1860
+ "single_word": false,
1861
+ "lstrip": false,
1862
+ "rstrip": false,
1863
+ "normalized": false,
1864
+ "special": true
1865
+ },
1866
+ "50261": {
1867
+ "content": "<|pad_token[213]|>",
1868
+ "single_word": false,
1869
+ "lstrip": false,
1870
+ "rstrip": false,
1871
+ "normalized": false,
1872
+ "special": true
1873
+ },
1874
+ "50262": {
1875
+ "content": "<|pad_token[214]|>",
1876
+ "single_word": false,
1877
+ "lstrip": false,
1878
+ "rstrip": false,
1879
+ "normalized": false,
1880
+ "special": true
1881
+ },
1882
+ "50263": {
1883
+ "content": "<|pad_token[215]|>",
1884
+ "single_word": false,
1885
+ "lstrip": false,
1886
+ "rstrip": false,
1887
+ "normalized": false,
1888
+ "special": true
1889
+ },
1890
+ "50264": {
1891
+ "content": "<|pad_token[216]|>",
1892
+ "single_word": false,
1893
+ "lstrip": false,
1894
+ "rstrip": false,
1895
+ "normalized": false,
1896
+ "special": true
1897
+ },
1898
+ "50265": {
1899
+ "content": "<|pad_token[217]|>",
1900
+ "single_word": false,
1901
+ "lstrip": false,
1902
+ "rstrip": false,
1903
+ "normalized": false,
1904
+ "special": true
1905
+ },
1906
+ "50266": {
1907
+ "content": "<|pad_token[218]|>",
1908
+ "single_word": false,
1909
+ "lstrip": false,
1910
+ "rstrip": false,
1911
+ "normalized": false,
1912
+ "special": true
1913
+ },
1914
+ "50267": {
1915
+ "content": "<|pad_token[219]|>",
1916
+ "single_word": false,
1917
+ "lstrip": false,
1918
+ "rstrip": false,
1919
+ "normalized": false,
1920
+ "special": true
1921
+ },
1922
+ "50268": {
1923
+ "content": "<|pad_token[220]|>",
1924
+ "single_word": false,
1925
+ "lstrip": false,
1926
+ "rstrip": false,
1927
+ "normalized": false,
1928
+ "special": true
1929
+ },
1930
+ "50269": {
1931
+ "content": "<|pad_token[221]|>",
1932
+ "single_word": false,
1933
+ "lstrip": false,
1934
+ "rstrip": false,
1935
+ "normalized": false,
1936
+ "special": true
1937
+ },
1938
+ "50270": {
1939
+ "content": "<|pad_token[222]|>",
1940
+ "single_word": false,
1941
+ "lstrip": false,
1942
+ "rstrip": false,
1943
+ "normalized": false,
1944
+ "special": true
1945
+ },
1946
+ "50271": {
1947
+ "content": "<|pad_token[223]|>",
1948
+ "single_word": false,
1949
+ "lstrip": false,
1950
+ "rstrip": false,
1951
+ "normalized": false,
1952
+ "special": true
1953
+ },
1954
+ "50272": {
1955
+ "content": "<|pad_token[224]|>",
1956
+ "single_word": false,
1957
+ "lstrip": false,
1958
+ "rstrip": false,
1959
+ "normalized": false,
1960
+ "special": true
1961
+ },
1962
+ "50273": {
1963
+ "content": "<|pad_token[225]|>",
1964
+ "single_word": false,
1965
+ "lstrip": false,
1966
+ "rstrip": false,
1967
+ "normalized": false,
1968
+ "special": true
1969
+ },
1970
+ "50274": {
1971
+ "content": "<|pad_token[226]|>",
1972
+ "single_word": false,
1973
+ "lstrip": false,
1974
+ "rstrip": false,
1975
+ "normalized": false,
1976
+ "special": true
1977
+ },
1978
+ "50275": {
1979
+ "content": "<|pad_token[227]|>",
1980
+ "single_word": false,
1981
+ "lstrip": false,
1982
+ "rstrip": false,
1983
+ "normalized": false,
1984
+ "special": true
1985
+ },
1986
+ "50276": {
1987
+ "content": "<|pad_token[228]|>",
1988
+ "single_word": false,
1989
+ "lstrip": false,
1990
+ "rstrip": false,
1991
+ "normalized": false,
1992
+ "special": true
1993
+ },
1994
+ "50277": {
1995
+ "content": "<|pad_token[229]|>",
1996
+ "single_word": false,
1997
+ "lstrip": false,
1998
+ "rstrip": false,
1999
+ "normalized": false,
2000
+ "special": true
2001
+ },
2002
+ "50278": {
2003
+ "content": "<|pad_token[230]|>",
2004
+ "single_word": false,
2005
+ "lstrip": false,
2006
+ "rstrip": false,
2007
+ "normalized": false,
2008
+ "special": true
2009
+ },
2010
+ "50279": {
2011
+ "content": "<|pad_token[231]|>",
2012
+ "single_word": false,
2013
+ "lstrip": false,
2014
+ "rstrip": false,
2015
+ "normalized": false,
2016
+ "special": true
2017
+ },
2018
+ "50280": {
2019
+ "content": "<|pad_token[232]|>",
2020
+ "single_word": false,
2021
+ "lstrip": false,
2022
+ "rstrip": false,
2023
+ "normalized": false,
2024
+ "special": true
2025
+ },
2026
+ "50281": {
2027
+ "content": "<|pad_token[233]|>",
2028
+ "single_word": false,
2029
+ "lstrip": false,
2030
+ "rstrip": false,
2031
+ "normalized": false,
2032
+ "special": true
2033
+ },
2034
+ "50282": {
2035
+ "content": "<|pad_token[234]|>",
2036
+ "single_word": false,
2037
+ "lstrip": false,
2038
+ "rstrip": false,
2039
+ "normalized": false,
2040
+ "special": true
2041
+ },
2042
+ "50283": {
2043
+ "content": "<|pad_token[235]|>",
2044
+ "single_word": false,
2045
+ "lstrip": false,
2046
+ "rstrip": false,
2047
+ "normalized": false,
2048
+ "special": true
2049
+ },
2050
+ "50284": {
2051
+ "content": "<|pad_token[236]|>",
2052
+ "single_word": false,
2053
+ "lstrip": false,
2054
+ "rstrip": false,
2055
+ "normalized": false,
2056
+ "special": true
2057
+ },
2058
+ "50285": {
2059
+ "content": "<|pad_token[237]|>",
2060
+ "single_word": false,
2061
+ "lstrip": false,
2062
+ "rstrip": false,
2063
+ "normalized": false,
2064
+ "special": true
2065
+ },
2066
+ "50286": {
2067
+ "content": "<|pad_token[238]|>",
2068
+ "single_word": false,
2069
+ "lstrip": false,
2070
+ "rstrip": false,
2071
+ "normalized": false,
2072
+ "special": true
2073
+ },
2074
+ "50287": {
2075
+ "content": "<|pad_token[239]|>",
2076
+ "single_word": false,
2077
+ "lstrip": false,
2078
+ "rstrip": false,
2079
+ "normalized": false,
2080
+ "special": true
2081
+ },
2082
+ "50288": {
2083
+ "content": "<|pad_token[240]|>",
2084
+ "single_word": false,
2085
+ "lstrip": false,
2086
+ "rstrip": false,
2087
+ "normalized": false,
2088
+ "special": true
2089
+ },
2090
+ "50289": {
2091
+ "content": "<|pad_token[241]|>",
2092
+ "single_word": false,
2093
+ "lstrip": false,
2094
+ "rstrip": false,
2095
+ "normalized": false,
2096
+ "special": true
2097
+ },
2098
+ "50290": {
2099
+ "content": "<|pad_token[242]|>",
2100
+ "single_word": false,
2101
+ "lstrip": false,
2102
+ "rstrip": false,
2103
+ "normalized": false,
2104
+ "special": true
2105
+ },
2106
+ "50291": {
2107
+ "content": "<|pad_token[243]|>",
2108
+ "single_word": false,
2109
+ "lstrip": false,
2110
+ "rstrip": false,
2111
+ "normalized": false,
2112
+ "special": true
2113
+ },
2114
+ "50292": {
2115
+ "content": "<|pad_token[244]|>",
2116
+ "single_word": false,
2117
+ "lstrip": false,
2118
+ "rstrip": false,
2119
+ "normalized": false,
2120
+ "special": true
2121
+ },
2122
+ "50293": {
2123
+ "content": "<|pad_token[245]|>",
2124
+ "single_word": false,
2125
+ "lstrip": false,
2126
+ "rstrip": false,
2127
+ "normalized": false,
2128
+ "special": true
2129
+ },
2130
+ "50294": {
2131
+ "content": "<|pad_token[246]|>",
2132
+ "single_word": false,
2133
+ "lstrip": false,
2134
+ "rstrip": false,
2135
+ "normalized": false,
2136
+ "special": true
2137
+ },
2138
+ "50295": {
2139
+ "content": "<|pad_token[247]|>",
2140
+ "single_word": false,
2141
+ "lstrip": false,
2142
+ "rstrip": false,
2143
+ "normalized": false,
2144
+ "special": true
2145
+ },
2146
+ "50296": {
2147
+ "content": "<|pad_token[248]|>",
2148
+ "single_word": false,
2149
+ "lstrip": false,
2150
+ "rstrip": false,
2151
+ "normalized": false,
2152
+ "special": true
2153
+ },
2154
+ "50297": {
2155
+ "content": "<|pad_token[249]|>",
2156
+ "single_word": false,
2157
+ "lstrip": false,
2158
+ "rstrip": false,
2159
+ "normalized": false,
2160
+ "special": true
2161
+ },
2162
+ "50298": {
2163
+ "content": "<|pad_token[250]|>",
2164
+ "single_word": false,
2165
+ "lstrip": false,
2166
+ "rstrip": false,
2167
+ "normalized": false,
2168
+ "special": true
2169
+ },
2170
+ "50299": {
2171
+ "content": "<|pad_token[251]|>",
2172
+ "single_word": false,
2173
+ "lstrip": false,
2174
+ "rstrip": false,
2175
+ "normalized": false,
2176
+ "special": true
2177
+ },
2178
+ "50300": {
2179
+ "content": "<|pad_token[252]|>",
2180
+ "single_word": false,
2181
+ "lstrip": false,
2182
+ "rstrip": false,
2183
+ "normalized": false,
2184
+ "special": true
2185
+ },
2186
+ "50301": {
2187
+ "content": "<|pad_token[253]|>",
2188
+ "single_word": false,
2189
+ "lstrip": false,
2190
+ "rstrip": false,
2191
+ "normalized": false,
2192
+ "special": true
2193
+ },
2194
+ "50302": {
2195
+ "content": "<|pad_token[254]|>",
2196
+ "single_word": false,
2197
+ "lstrip": false,
2198
+ "rstrip": false,
2199
+ "normalized": false,
2200
+ "special": true
2201
+ },
2202
+ "50303": {
2203
+ "content": "<|pad_token[255]|>",
2204
+ "single_word": false,
2205
+ "lstrip": false,
2206
+ "rstrip": false,
2207
+ "normalized": false,
2208
+ "special": true
2209
  }
2210
  }
2211
  }
last-checkpoint/trainer_state.json CHANGED
@@ -3,1383 +3,1117 @@
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
  "epoch": 0.01,
6
- "eval_steps": 3900,
7
- "global_step": 390,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
11
  "log_history": [
12
  {
13
- "epoch": 5.128205128205128e-05,
14
- "grad_norm": 6.96875,
15
- "learning_rate": 0.0005128205128205128,
16
- "loss": 11.028623580932617,
17
  "step": 2
18
  },
19
  {
20
- "epoch": 0.00010256410256410256,
21
- "grad_norm": 5.9375,
22
- "learning_rate": 0.0010256410256410256,
23
- "loss": 10.835494041442871,
24
  "step": 4
25
  },
26
  {
27
- "epoch": 0.00015384615384615385,
28
- "grad_norm": 5.25,
29
- "learning_rate": 0.0015384615384615387,
30
- "loss": 10.626424789428711,
31
  "step": 6
32
  },
33
  {
34
- "epoch": 0.00020512820512820512,
35
- "grad_norm": 4.96875,
36
- "learning_rate": 0.0020512820512820513,
37
- "loss": 10.43354606628418,
38
  "step": 8
39
  },
40
  {
41
- "epoch": 0.0002564102564102564,
42
- "grad_norm": 4.53125,
43
- "learning_rate": 0.002564102564102564,
44
- "loss": 10.232170104980469,
45
  "step": 10
46
  },
47
  {
48
- "epoch": 0.0003076923076923077,
49
- "grad_norm": 3.671875,
50
- "learning_rate": 0.0030769230769230774,
51
- "loss": 9.962776184082031,
52
  "step": 12
53
  },
54
  {
55
- "epoch": 0.000358974358974359,
56
- "grad_norm": 3.015625,
57
- "learning_rate": 0.00358974358974359,
58
- "loss": 9.638317108154297,
59
  "step": 14
60
  },
61
  {
62
- "epoch": 0.00041025641025641023,
63
- "grad_norm": 2.453125,
64
- "learning_rate": 0.0041025641025641026,
65
- "loss": 9.297982215881348,
66
  "step": 16
67
  },
68
  {
69
- "epoch": 0.00046153846153846153,
70
- "grad_norm": 2.734375,
71
- "learning_rate": 0.004615384615384616,
72
- "loss": 8.92674732208252,
73
  "step": 18
74
  },
75
  {
76
- "epoch": 0.0005128205128205128,
77
- "grad_norm": 2.765625,
78
- "learning_rate": 0.005128205128205128,
79
- "loss": 8.53368091583252,
80
  "step": 20
81
  },
82
  {
83
- "epoch": 0.0005641025641025641,
84
- "grad_norm": 3.390625,
85
- "learning_rate": 0.0056410256410256415,
86
- "loss": 8.150374412536621,
87
  "step": 22
88
  },
89
  {
90
- "epoch": 0.0006153846153846154,
91
- "grad_norm": 3.671875,
92
- "learning_rate": 0.006153846153846155,
93
- "loss": 7.803437232971191,
94
  "step": 24
95
  },
96
  {
97
- "epoch": 0.0006666666666666666,
98
- "grad_norm": 3.75,
99
- "learning_rate": 0.006666666666666667,
100
- "loss": 7.4913330078125,
101
  "step": 26
102
  },
103
  {
104
- "epoch": 0.000717948717948718,
105
- "grad_norm": 3.8125,
106
- "learning_rate": 0.00717948717948718,
107
- "loss": 7.2185750007629395,
108
  "step": 28
109
  },
110
  {
111
- "epoch": 0.0007692307692307692,
112
- "grad_norm": 5.09375,
113
- "learning_rate": 0.007692307692307693,
114
- "loss": 6.9673566818237305,
115
  "step": 30
116
  },
117
  {
118
- "epoch": 0.0008205128205128205,
119
- "grad_norm": 7.03125,
120
- "learning_rate": 0.008205128205128205,
121
- "loss": 6.730362892150879,
122
  "step": 32
123
  },
124
  {
125
- "epoch": 0.0008717948717948718,
126
- "grad_norm": 8.875,
127
- "learning_rate": 0.00871794871794872,
128
- "loss": 6.566787242889404,
129
  "step": 34
130
  },
131
  {
132
- "epoch": 0.0009230769230769231,
133
- "grad_norm": 8.375,
134
- "learning_rate": 0.009230769230769232,
135
- "loss": 6.36342716217041,
136
  "step": 36
137
  },
138
  {
139
- "epoch": 0.0009743589743589744,
140
- "grad_norm": 8.375,
141
- "learning_rate": 0.009743589743589744,
142
- "loss": 6.160152435302734,
143
  "step": 38
144
  },
145
  {
146
- "epoch": 0.0010256410256410256,
147
- "grad_norm": 8.375,
148
- "learning_rate": 0.010256410256410256,
149
- "loss": 6.030362129211426,
150
  "step": 40
151
  },
152
  {
153
- "epoch": 0.0010769230769230769,
154
- "grad_norm": 7.59375,
155
- "learning_rate": 0.01076923076923077,
156
- "loss": 5.868592739105225,
157
  "step": 42
158
  },
159
  {
160
- "epoch": 0.0011282051282051281,
161
- "grad_norm": 7.21875,
162
- "learning_rate": 0.011282051282051283,
163
- "loss": 5.7172956466674805,
164
  "step": 44
165
  },
166
  {
167
- "epoch": 0.0011794871794871796,
168
- "grad_norm": 7.0,
169
- "learning_rate": 0.011794871794871797,
170
- "loss": 5.569025993347168,
171
  "step": 46
172
  },
173
  {
174
- "epoch": 0.0012307692307692308,
175
- "grad_norm": 6.46875,
176
- "learning_rate": 0.01230769230769231,
177
- "loss": 5.417316436767578,
178
  "step": 48
179
  },
180
  {
181
- "epoch": 0.001282051282051282,
182
- "grad_norm": 5.53125,
183
- "learning_rate": 0.01282051282051282,
184
- "loss": 5.258627414703369,
185
  "step": 50
186
  },
187
  {
188
- "epoch": 0.0013333333333333333,
189
- "grad_norm": 5.78125,
190
- "learning_rate": 0.013333333333333334,
191
- "loss": 5.114855766296387,
192
  "step": 52
193
  },
194
  {
195
- "epoch": 0.0013846153846153845,
196
- "grad_norm": 4.34375,
197
- "learning_rate": 0.013846153846153847,
198
- "loss": 4.965922832489014,
199
  "step": 54
200
  },
201
  {
202
- "epoch": 0.001435897435897436,
203
- "grad_norm": 3.296875,
204
- "learning_rate": 0.01435897435897436,
205
- "loss": 4.81715726852417,
206
  "step": 56
207
  },
208
  {
209
- "epoch": 0.0014871794871794872,
210
- "grad_norm": 3.0625,
211
- "learning_rate": 0.014871794871794873,
212
- "loss": 4.687244415283203,
213
  "step": 58
214
  },
215
  {
216
- "epoch": 0.0015384615384615385,
217
- "grad_norm": 1.96875,
218
- "learning_rate": 0.015384615384615385,
219
- "loss": 4.546048164367676,
220
  "step": 60
221
  },
222
  {
223
- "epoch": 0.0015897435897435897,
224
- "grad_norm": 2.03125,
225
- "learning_rate": 0.015897435897435898,
226
- "loss": 4.4834818840026855,
227
  "step": 62
228
  },
229
  {
230
- "epoch": 0.001641025641025641,
231
- "grad_norm": 2.171875,
232
- "learning_rate": 0.01641025641025641,
233
- "loss": 4.364042282104492,
234
  "step": 64
235
  },
236
  {
237
- "epoch": 0.0016923076923076924,
238
- "grad_norm": 2.4375,
239
- "learning_rate": 0.016923076923076926,
240
- "loss": 4.284972667694092,
241
  "step": 66
242
  },
243
  {
244
- "epoch": 0.0017435897435897436,
245
- "grad_norm": 1.8828125,
246
- "learning_rate": 0.01743589743589744,
247
- "loss": 4.193305492401123,
248
  "step": 68
249
  },
250
  {
251
- "epoch": 0.0017948717948717949,
252
- "grad_norm": 1.625,
253
- "learning_rate": 0.017948717948717947,
254
- "loss": 4.111180305480957,
255
  "step": 70
256
  },
257
  {
258
- "epoch": 0.0018461538461538461,
259
- "grad_norm": 1.1953125,
260
- "learning_rate": 0.018461538461538463,
261
- "loss": 4.065956115722656,
262
  "step": 72
263
  },
264
  {
265
- "epoch": 0.0018974358974358973,
266
- "grad_norm": 1.3671875,
267
- "learning_rate": 0.018974358974358976,
268
- "loss": 3.992979049682617,
269
  "step": 74
270
  },
271
  {
272
- "epoch": 0.0019487179487179488,
273
- "grad_norm": 1.09375,
274
- "learning_rate": 0.019487179487179488,
275
- "loss": 3.9563088417053223,
276
  "step": 76
277
  },
278
  {
279
- "epoch": 0.002,
280
- "grad_norm": 1.140625,
281
- "learning_rate": 0.02,
282
- "loss": 3.9258062839508057,
283
  "step": 78
284
  },
285
  {
286
- "epoch": 0.0020512820512820513,
287
- "grad_norm": 1.0625,
288
- "learning_rate": 0.020512820512820513,
289
- "loss": 3.8419349193573,
290
  "step": 80
291
  },
292
  {
293
- "epoch": 0.0021025641025641025,
294
- "grad_norm": 0.97265625,
295
- "learning_rate": 0.02102564102564103,
296
- "loss": 3.8219480514526367,
297
  "step": 82
298
  },
299
  {
300
- "epoch": 0.0021538461538461538,
301
- "grad_norm": 0.90625,
302
- "learning_rate": 0.02153846153846154,
303
- "loss": 3.7782399654388428,
304
  "step": 84
305
  },
306
  {
307
- "epoch": 0.002205128205128205,
308
- "grad_norm": 0.9453125,
309
- "learning_rate": 0.02205128205128205,
310
- "loss": 3.740063428878784,
311
  "step": 86
312
  },
313
  {
314
- "epoch": 0.0022564102564102562,
315
- "grad_norm": 0.96484375,
316
- "learning_rate": 0.022564102564102566,
317
- "loss": 3.693281888961792,
318
  "step": 88
319
  },
320
  {
321
- "epoch": 0.002307692307692308,
322
- "grad_norm": 0.9609375,
323
- "learning_rate": 0.023076923076923078,
324
- "loss": 3.677046775817871,
325
  "step": 90
326
  },
327
  {
328
- "epoch": 0.002358974358974359,
329
- "grad_norm": 0.78125,
330
- "learning_rate": 0.023589743589743594,
331
- "loss": 3.6315693855285645,
332
  "step": 92
333
  },
334
  {
335
- "epoch": 0.0024102564102564104,
336
- "grad_norm": 1.0078125,
337
- "learning_rate": 0.024102564102564103,
338
- "loss": 3.597317695617676,
339
  "step": 94
340
  },
341
  {
342
- "epoch": 0.0024615384615384616,
343
- "grad_norm": 0.6640625,
344
- "learning_rate": 0.02461538461538462,
345
- "loss": 3.5555150508880615,
346
  "step": 96
347
  },
348
  {
349
- "epoch": 0.002512820512820513,
350
- "grad_norm": 0.96484375,
351
- "learning_rate": 0.02512820512820513,
352
- "loss": 3.5442092418670654,
353
  "step": 98
354
  },
355
  {
356
- "epoch": 0.002564102564102564,
357
- "grad_norm": 0.7421875,
358
- "learning_rate": 0.02564102564102564,
359
- "loss": 3.5661072731018066,
360
  "step": 100
361
  },
362
  {
363
- "epoch": 0.0026153846153846153,
364
- "grad_norm": 0.7265625,
365
- "learning_rate": 0.026153846153846156,
366
- "loss": 3.562504768371582,
367
  "step": 102
368
  },
369
  {
370
- "epoch": 0.0026666666666666666,
371
- "grad_norm": 0.703125,
372
- "learning_rate": 0.02666666666666667,
373
- "loss": 3.6011133193969727,
374
  "step": 104
375
  },
376
  {
377
- "epoch": 0.002717948717948718,
378
- "grad_norm": 0.9296875,
379
- "learning_rate": 0.027179487179487184,
380
- "loss": 3.5903480052948,
381
  "step": 106
382
  },
383
  {
384
- "epoch": 0.002769230769230769,
385
- "grad_norm": 0.62109375,
386
- "learning_rate": 0.027692307692307693,
387
- "loss": 3.62792706489563,
388
  "step": 108
389
  },
390
  {
391
- "epoch": 0.0028205128205128207,
392
- "grad_norm": 0.8046875,
393
- "learning_rate": 0.028205128205128206,
394
- "loss": 3.5491697788238525,
395
  "step": 110
396
  },
397
  {
398
- "epoch": 0.002871794871794872,
399
- "grad_norm": 0.71484375,
400
- "learning_rate": 0.02871794871794872,
401
- "loss": 3.566171169281006,
402
  "step": 112
403
  },
404
  {
405
- "epoch": 0.002923076923076923,
406
- "grad_norm": 0.75,
407
- "learning_rate": 0.02923076923076923,
408
- "loss": 3.600825309753418,
409
  "step": 114
410
  },
411
  {
412
- "epoch": 0.0029743589743589744,
413
- "grad_norm": 0.66796875,
414
- "learning_rate": 0.029743589743589746,
415
- "loss": 3.5996663570404053,
416
  "step": 116
417
  },
418
  {
419
- "epoch": 0.0030256410256410257,
420
- "grad_norm": 0.59375,
421
- "learning_rate": 0.03025641025641026,
422
- "loss": 3.5554251670837402,
423
  "step": 118
424
  },
425
  {
426
- "epoch": 0.003076923076923077,
427
- "grad_norm": 0.625,
428
- "learning_rate": 0.03076923076923077,
429
- "loss": 3.5802998542785645,
430
  "step": 120
431
  },
432
  {
433
- "epoch": 0.003128205128205128,
434
- "grad_norm": 0.578125,
435
- "learning_rate": 0.03128205128205128,
436
- "loss": 3.591398239135742,
437
  "step": 122
438
  },
439
  {
440
- "epoch": 0.0031794871794871794,
441
- "grad_norm": 0.58984375,
442
- "learning_rate": 0.031794871794871796,
443
- "loss": 3.568976879119873,
444
  "step": 124
445
  },
446
  {
447
- "epoch": 0.0032307692307692306,
448
- "grad_norm": 0.7578125,
449
- "learning_rate": 0.03230769230769231,
450
- "loss": 3.5728864669799805,
451
  "step": 126
452
  },
453
  {
454
- "epoch": 0.003282051282051282,
455
- "grad_norm": 0.53515625,
456
- "learning_rate": 0.03282051282051282,
457
- "loss": 3.572187662124634,
458
  "step": 128
459
  },
460
  {
461
- "epoch": 0.0033333333333333335,
462
- "grad_norm": 0.58203125,
463
- "learning_rate": 0.03333333333333333,
464
- "loss": 3.580453634262085,
465
  "step": 130
466
  },
467
  {
468
- "epoch": 0.003384615384615385,
469
- "grad_norm": 0.546875,
470
- "learning_rate": 0.03384615384615385,
471
- "loss": 3.5927364826202393,
472
  "step": 132
473
  },
474
  {
475
- "epoch": 0.003435897435897436,
476
- "grad_norm": 0.498046875,
477
- "learning_rate": 0.03435897435897436,
478
- "loss": 3.631333351135254,
479
  "step": 134
480
  },
481
  {
482
- "epoch": 0.0034871794871794873,
483
- "grad_norm": 0.65625,
484
- "learning_rate": 0.03487179487179488,
485
- "loss": 3.6253650188446045,
486
  "step": 136
487
  },
488
  {
489
- "epoch": 0.0035384615384615385,
490
- "grad_norm": 0.5703125,
491
- "learning_rate": 0.03538461538461539,
492
- "loss": 3.585386276245117,
493
  "step": 138
494
  },
495
  {
496
- "epoch": 0.0035897435897435897,
497
- "grad_norm": 0.53515625,
498
- "learning_rate": 0.035897435897435895,
499
- "loss": 3.608487129211426,
500
  "step": 140
501
  },
502
  {
503
- "epoch": 0.003641025641025641,
504
- "grad_norm": 0.56640625,
505
- "learning_rate": 0.036410256410256414,
506
- "loss": 3.583284378051758,
507
  "step": 142
508
  },
509
  {
510
- "epoch": 0.0036923076923076922,
511
- "grad_norm": 0.5703125,
512
- "learning_rate": 0.036923076923076927,
513
- "loss": 3.5945990085601807,
514
  "step": 144
515
  },
516
  {
517
- "epoch": 0.0037435897435897435,
518
- "grad_norm": 0.54296875,
519
- "learning_rate": 0.03743589743589744,
520
- "loss": 3.5919718742370605,
521
  "step": 146
522
  },
523
  {
524
- "epoch": 0.0037948717948717947,
525
- "grad_norm": 0.47265625,
526
- "learning_rate": 0.03794871794871795,
527
- "loss": 3.621609687805176,
528
  "step": 148
529
  },
530
  {
531
- "epoch": 0.0038461538461538464,
532
- "grad_norm": 0.546875,
533
- "learning_rate": 0.038461538461538464,
534
- "loss": 3.60060715675354,
535
  "step": 150
536
  },
537
  {
538
- "epoch": 0.0038974358974358976,
539
- "grad_norm": 0.53125,
540
- "learning_rate": 0.038974358974358976,
541
- "loss": 3.584505081176758,
542
  "step": 152
543
  },
544
  {
545
- "epoch": 0.003948717948717949,
546
- "grad_norm": 0.52734375,
547
- "learning_rate": 0.03948717948717949,
548
- "loss": 3.56527042388916,
549
  "step": 154
550
  },
551
  {
552
- "epoch": 0.004,
553
- "grad_norm": 0.51171875,
554
- "learning_rate": 0.04,
555
- "loss": 3.5620148181915283,
556
  "step": 156
557
  },
558
  {
559
- "epoch": 0.004051282051282051,
560
- "grad_norm": 0.404296875,
561
- "learning_rate": 0.04051282051282051,
562
- "loss": 3.6077682971954346,
563
  "step": 158
564
  },
565
  {
566
- "epoch": 0.0041025641025641026,
567
- "grad_norm": 0.42578125,
568
- "learning_rate": 0.041025641025641026,
569
- "loss": 3.572093963623047,
570
  "step": 160
571
  },
572
  {
573
- "epoch": 0.004153846153846154,
574
- "grad_norm": 0.453125,
575
- "learning_rate": 0.04153846153846154,
576
- "loss": 3.5625109672546387,
577
  "step": 162
578
  },
579
  {
580
- "epoch": 0.004205128205128205,
581
- "grad_norm": 0.453125,
582
- "learning_rate": 0.04205128205128206,
583
- "loss": 3.6565420627593994,
584
  "step": 164
585
  },
586
  {
587
- "epoch": 0.004256410256410256,
588
- "grad_norm": 0.4453125,
589
- "learning_rate": 0.04256410256410257,
590
- "loss": 3.5821502208709717,
591
  "step": 166
592
  },
593
  {
594
- "epoch": 0.0043076923076923075,
595
- "grad_norm": 0.375,
596
- "learning_rate": 0.04307692307692308,
597
- "loss": 3.5616493225097656,
598
  "step": 168
599
  },
600
  {
601
- "epoch": 0.004358974358974359,
602
- "grad_norm": 0.404296875,
603
- "learning_rate": 0.04358974358974359,
604
- "loss": 3.5844054222106934,
605
  "step": 170
606
  },
607
  {
608
- "epoch": 0.00441025641025641,
609
- "grad_norm": 0.484375,
610
- "learning_rate": 0.0441025641025641,
611
- "loss": 3.596921443939209,
612
  "step": 172
613
  },
614
  {
615
- "epoch": 0.004461538461538461,
616
- "grad_norm": 0.4921875,
617
- "learning_rate": 0.04461538461538462,
618
- "loss": 3.580339193344116,
619
  "step": 174
620
  },
621
  {
622
- "epoch": 0.0045128205128205125,
623
- "grad_norm": 0.46484375,
624
- "learning_rate": 0.04512820512820513,
625
- "loss": 3.540377378463745,
626
  "step": 176
627
  },
628
  {
629
- "epoch": 0.004564102564102564,
630
- "grad_norm": 0.435546875,
631
- "learning_rate": 0.045641025641025644,
632
- "loss": 3.4948010444641113,
633
  "step": 178
634
  },
635
  {
636
- "epoch": 0.004615384615384616,
637
- "grad_norm": 0.427734375,
638
- "learning_rate": 0.046153846153846156,
639
- "loss": 3.5890262126922607,
640
  "step": 180
641
  },
642
  {
643
- "epoch": 0.004666666666666667,
644
- "grad_norm": 0.435546875,
645
- "learning_rate": 0.04666666666666666,
646
- "loss": 3.5203731060028076,
647
  "step": 182
648
  },
649
  {
650
- "epoch": 0.004717948717948718,
651
- "grad_norm": 0.50390625,
652
- "learning_rate": 0.04717948717948719,
653
- "loss": 3.5634355545043945,
654
  "step": 184
655
  },
656
  {
657
- "epoch": 0.0047692307692307695,
658
- "grad_norm": 0.494140625,
659
- "learning_rate": 0.047692307692307694,
660
- "loss": 3.5992159843444824,
661
  "step": 186
662
  },
663
  {
664
- "epoch": 0.004820512820512821,
665
- "grad_norm": 0.3359375,
666
- "learning_rate": 0.048205128205128206,
667
- "loss": 3.5432937145233154,
668
  "step": 188
669
  },
670
  {
671
- "epoch": 0.004871794871794872,
672
- "grad_norm": 0.470703125,
673
- "learning_rate": 0.04871794871794872,
674
- "loss": 3.5420024394989014,
675
  "step": 190
676
  },
677
  {
678
- "epoch": 0.004923076923076923,
679
- "grad_norm": 0.376953125,
680
- "learning_rate": 0.04923076923076924,
681
- "loss": 3.5438649654388428,
682
  "step": 192
683
  },
684
  {
685
- "epoch": 0.0049743589743589745,
686
- "grad_norm": 0.46484375,
687
- "learning_rate": 0.04974358974358975,
688
- "loss": 3.558898448944092,
689
  "step": 194
690
  },
691
  {
692
- "epoch": 0.005025641025641026,
693
- "grad_norm": 0.400390625,
694
- "learning_rate": 0.05025641025641026,
695
- "loss": 3.5653491020202637,
696
  "step": 196
697
  },
698
  {
699
- "epoch": 0.005076923076923077,
700
- "grad_norm": 0.38671875,
701
- "learning_rate": 0.05076923076923077,
702
- "loss": 3.5160062313079834,
703
  "step": 198
704
  },
705
  {
706
- "epoch": 0.005128205128205128,
707
- "grad_norm": 0.373046875,
708
- "learning_rate": 0.05128205128205128,
709
- "loss": 3.634993553161621,
710
  "step": 200
711
  },
712
  {
713
- "epoch": 0.0051794871794871794,
714
- "grad_norm": 0.37109375,
715
- "learning_rate": 0.0517948717948718,
716
- "loss": 3.5891895294189453,
717
  "step": 202
718
  },
719
  {
720
- "epoch": 0.005230769230769231,
721
- "grad_norm": 0.283203125,
722
- "learning_rate": 0.05230769230769231,
723
- "loss": 3.517305612564087,
724
  "step": 204
725
  },
726
  {
727
- "epoch": 0.005282051282051282,
728
- "grad_norm": 0.365234375,
729
- "learning_rate": 0.052820512820512824,
730
- "loss": 3.5225830078125,
731
  "step": 206
732
  },
733
  {
734
- "epoch": 0.005333333333333333,
735
- "grad_norm": 0.388671875,
736
- "learning_rate": 0.05333333333333334,
737
- "loss": 3.59674334526062,
738
  "step": 208
739
  },
740
  {
741
- "epoch": 0.005384615384615384,
742
- "grad_norm": 0.3984375,
743
- "learning_rate": 0.05384615384615385,
744
- "loss": 3.568952798843384,
745
  "step": 210
746
  },
747
  {
748
- "epoch": 0.005435897435897436,
749
- "grad_norm": 0.345703125,
750
- "learning_rate": 0.05435897435897437,
751
- "loss": 3.5675606727600098,
752
  "step": 212
753
  },
754
  {
755
- "epoch": 0.005487179487179487,
756
- "grad_norm": 0.326171875,
757
- "learning_rate": 0.054871794871794874,
758
- "loss": 3.5722639560699463,
759
  "step": 214
760
  },
761
  {
762
- "epoch": 0.005538461538461538,
763
- "grad_norm": 0.37890625,
764
- "learning_rate": 0.055384615384615386,
765
- "loss": 3.578686237335205,
766
  "step": 216
767
  },
768
  {
769
- "epoch": 0.005589743589743589,
770
- "grad_norm": 0.34375,
771
- "learning_rate": 0.0558974358974359,
772
- "loss": 3.5788979530334473,
773
  "step": 218
774
  },
775
  {
776
- "epoch": 0.0056410256410256415,
777
- "grad_norm": 0.392578125,
778
- "learning_rate": 0.05641025641025641,
779
- "loss": 3.523505926132202,
780
  "step": 220
781
  },
782
  {
783
- "epoch": 0.005692307692307693,
784
- "grad_norm": 0.326171875,
785
- "learning_rate": 0.05692307692307693,
786
- "loss": 3.497835874557495,
787
  "step": 222
788
  },
789
  {
790
- "epoch": 0.005743589743589744,
791
- "grad_norm": 0.341796875,
792
- "learning_rate": 0.05743589743589744,
793
- "loss": 3.5063397884368896,
794
  "step": 224
795
  },
796
  {
797
- "epoch": 0.005794871794871795,
798
- "grad_norm": 0.310546875,
799
- "learning_rate": 0.057948717948717955,
800
- "loss": 3.4735443592071533,
801
  "step": 226
802
  },
803
  {
804
- "epoch": 0.005846153846153846,
805
- "grad_norm": 0.32421875,
806
- "learning_rate": 0.05846153846153846,
807
- "loss": 3.536956787109375,
808
  "step": 228
809
  },
810
  {
811
- "epoch": 0.005897435897435898,
812
- "grad_norm": 0.361328125,
813
- "learning_rate": 0.05897435897435897,
814
- "loss": 3.534363031387329,
815
  "step": 230
816
  },
817
  {
818
- "epoch": 0.005948717948717949,
819
- "grad_norm": 0.314453125,
820
- "learning_rate": 0.05948717948717949,
821
- "loss": 3.535642623901367,
822
  "step": 232
823
  },
824
  {
825
- "epoch": 0.006,
826
- "grad_norm": 0.361328125,
827
- "learning_rate": 0.060000000000000005,
828
- "loss": 3.498642921447754,
829
  "step": 234
830
  },
831
  {
832
- "epoch": 0.006051282051282051,
833
- "grad_norm": 0.34765625,
834
- "learning_rate": 0.06051282051282052,
835
- "loss": 3.5290956497192383,
836
  "step": 236
837
  },
838
  {
839
- "epoch": 0.006102564102564103,
840
- "grad_norm": 0.322265625,
841
- "learning_rate": 0.06102564102564103,
842
- "loss": 3.4969096183776855,
843
  "step": 238
844
  },
845
  {
846
- "epoch": 0.006153846153846154,
847
- "grad_norm": 0.31640625,
848
- "learning_rate": 0.06153846153846154,
849
- "loss": 3.4753830432891846,
850
  "step": 240
851
  },
852
  {
853
- "epoch": 0.006205128205128205,
854
- "grad_norm": 0.298828125,
855
- "learning_rate": 0.06205128205128206,
856
- "loss": 3.4777991771698,
857
  "step": 242
858
  },
859
  {
860
- "epoch": 0.006256410256410256,
861
- "grad_norm": 0.28515625,
862
- "learning_rate": 0.06256410256410257,
863
- "loss": 3.4336612224578857,
864
  "step": 244
865
  },
866
  {
867
- "epoch": 0.0063076923076923076,
868
- "grad_norm": 0.37890625,
869
- "learning_rate": 0.06307692307692309,
870
- "loss": 3.4642059803009033,
871
  "step": 246
872
  },
873
  {
874
- "epoch": 0.006358974358974359,
875
- "grad_norm": 0.2890625,
876
- "learning_rate": 0.06358974358974359,
877
- "loss": 3.472360610961914,
878
  "step": 248
879
  },
880
  {
881
- "epoch": 0.00641025641025641,
882
- "grad_norm": 0.2578125,
883
- "learning_rate": 0.0641025641025641,
884
- "loss": 3.4250106811523438,
885
  "step": 250
886
  },
887
  {
888
- "epoch": 0.006461538461538461,
889
- "grad_norm": 0.310546875,
890
- "learning_rate": 0.06461538461538462,
891
- "loss": 3.4243407249450684,
892
  "step": 252
893
  },
894
  {
895
- "epoch": 0.0065128205128205125,
896
- "grad_norm": 0.296875,
897
- "learning_rate": 0.06512820512820514,
898
- "loss": 3.443620204925537,
899
  "step": 254
900
  },
901
  {
902
- "epoch": 0.006564102564102564,
903
- "grad_norm": 0.2578125,
904
- "learning_rate": 0.06564102564102564,
905
- "loss": 3.446272850036621,
906
  "step": 256
907
  },
908
  {
909
- "epoch": 0.006615384615384615,
910
- "grad_norm": 0.30859375,
911
- "learning_rate": 0.06615384615384616,
912
- "loss": 3.446471691131592,
913
  "step": 258
914
  },
915
  {
916
- "epoch": 0.006666666666666667,
917
- "grad_norm": 0.3125,
918
- "learning_rate": 0.06666666666666667,
919
- "loss": 3.4094085693359375,
920
  "step": 260
921
  },
922
  {
923
- "epoch": 0.006717948717948718,
924
- "grad_norm": 0.26171875,
925
- "learning_rate": 0.06717948717948719,
926
- "loss": 3.4011497497558594,
927
  "step": 262
928
  },
929
  {
930
- "epoch": 0.00676923076923077,
931
- "grad_norm": 0.28515625,
932
- "learning_rate": 0.0676923076923077,
933
- "loss": 3.4120538234710693,
934
  "step": 264
935
  },
936
  {
937
- "epoch": 0.006820512820512821,
938
- "grad_norm": 0.287109375,
939
- "learning_rate": 0.06820512820512821,
940
- "loss": 3.3494560718536377,
941
  "step": 266
942
  },
943
  {
944
- "epoch": 0.006871794871794872,
945
- "grad_norm": 0.2470703125,
946
- "learning_rate": 0.06871794871794872,
947
- "loss": 3.3833444118499756,
948
  "step": 268
949
  },
950
  {
951
- "epoch": 0.006923076923076923,
952
- "grad_norm": 0.259765625,
953
- "learning_rate": 0.06923076923076923,
954
- "loss": 3.334336280822754,
955
  "step": 270
956
  },
957
  {
958
- "epoch": 0.0069743589743589745,
959
- "grad_norm": 0.375,
960
- "learning_rate": 0.06974358974358975,
961
- "loss": 3.3835675716400146,
962
  "step": 272
963
  },
964
  {
965
- "epoch": 0.007025641025641026,
966
- "grad_norm": 0.283203125,
967
- "learning_rate": 0.07025641025641026,
968
- "loss": 3.365119695663452,
969
  "step": 274
970
  },
971
  {
972
- "epoch": 0.007076923076923077,
973
- "grad_norm": 0.265625,
974
- "learning_rate": 0.07076923076923078,
975
- "loss": 3.3161237239837646,
976
  "step": 276
977
  },
978
  {
979
- "epoch": 0.007128205128205128,
980
- "grad_norm": 0.2421875,
981
- "learning_rate": 0.07128205128205128,
982
- "loss": 3.3265950679779053,
983
  "step": 278
984
  },
985
  {
986
- "epoch": 0.0071794871794871795,
987
- "grad_norm": 0.267578125,
988
- "learning_rate": 0.07179487179487179,
989
- "loss": 3.3481881618499756,
990
  "step": 280
991
  },
992
  {
993
- "epoch": 0.007230769230769231,
994
- "grad_norm": 0.259765625,
995
- "learning_rate": 0.07230769230769231,
996
- "loss": 3.3163304328918457,
997
  "step": 282
998
  },
999
  {
1000
- "epoch": 0.007282051282051282,
1001
- "grad_norm": 0.26171875,
1002
- "learning_rate": 0.07282051282051283,
1003
- "loss": 3.3111186027526855,
1004
  "step": 284
1005
  },
1006
  {
1007
- "epoch": 0.007333333333333333,
1008
- "grad_norm": 0.2353515625,
1009
- "learning_rate": 0.07333333333333333,
1010
- "loss": 3.2506864070892334,
1011
  "step": 286
1012
  },
1013
  {
1014
- "epoch": 0.0073846153846153844,
1015
- "grad_norm": 0.26171875,
1016
- "learning_rate": 0.07384615384615385,
1017
- "loss": 3.2985129356384277,
1018
  "step": 288
1019
  },
1020
  {
1021
- "epoch": 0.007435897435897436,
1022
- "grad_norm": 0.291015625,
1023
- "learning_rate": 0.07435897435897436,
1024
- "loss": 3.3391776084899902,
1025
  "step": 290
1026
  },
1027
  {
1028
- "epoch": 0.007487179487179487,
1029
- "grad_norm": 0.287109375,
1030
- "learning_rate": 0.07487179487179488,
1031
- "loss": 3.2946319580078125,
1032
  "step": 292
1033
  },
1034
  {
1035
- "epoch": 0.007538461538461538,
1036
- "grad_norm": 0.30859375,
1037
- "learning_rate": 0.07538461538461538,
1038
- "loss": 3.29689359664917,
1039
  "step": 294
1040
  },
1041
  {
1042
- "epoch": 0.007589743589743589,
1043
- "grad_norm": 0.275390625,
1044
- "learning_rate": 0.0758974358974359,
1045
- "loss": 3.2784714698791504,
1046
  "step": 296
1047
  },
1048
  {
1049
- "epoch": 0.007641025641025641,
1050
- "grad_norm": 0.255859375,
1051
- "learning_rate": 0.07641025641025641,
1052
- "loss": 3.3045074939727783,
1053
  "step": 298
1054
  },
1055
  {
1056
- "epoch": 0.007692307692307693,
1057
- "grad_norm": 0.302734375,
1058
- "learning_rate": 0.07692307692307693,
1059
- "loss": 3.2847025394439697,
1060
  "step": 300
1061
  },
1062
  {
1063
- "epoch": 0.007743589743589744,
1064
- "grad_norm": 0.263671875,
1065
- "learning_rate": 0.07743589743589745,
1066
- "loss": 3.288940191268921,
1067
  "step": 302
1068
  },
1069
  {
1070
- "epoch": 0.007794871794871795,
1071
- "grad_norm": 0.267578125,
1072
- "learning_rate": 0.07794871794871795,
1073
- "loss": 3.274775743484497,
1074
  "step": 304
1075
  },
1076
  {
1077
- "epoch": 0.007846153846153846,
1078
- "grad_norm": 0.224609375,
1079
- "learning_rate": 0.07846153846153847,
1080
- "loss": 3.239638566970825,
1081
  "step": 306
1082
  },
1083
  {
1084
- "epoch": 0.007897435897435898,
1085
- "grad_norm": 0.263671875,
1086
- "learning_rate": 0.07897435897435898,
1087
- "loss": 3.236365795135498,
1088
  "step": 308
1089
  },
1090
  {
1091
- "epoch": 0.007948717948717949,
1092
- "grad_norm": 0.2041015625,
1093
- "learning_rate": 0.07948717948717948,
1094
- "loss": 3.226825714111328,
1095
  "step": 310
1096
  },
1097
  {
1098
- "epoch": 0.008,
1099
- "grad_norm": 0.2470703125,
1100
- "learning_rate": 0.08,
1101
- "loss": 3.215003252029419,
1102
  "step": 312
1103
  },
1104
  {
1105
- "epoch": 0.008051282051282051,
1106
- "grad_norm": 0.2236328125,
1107
- "learning_rate": 0.08051282051282052,
1108
- "loss": 3.243821620941162,
1109
  "step": 314
1110
- },
1111
- {
1112
- "epoch": 0.008102564102564103,
1113
- "grad_norm": 0.21484375,
1114
- "learning_rate": 0.08102564102564103,
1115
- "loss": 3.2331736087799072,
1116
- "step": 316
1117
- },
1118
- {
1119
- "epoch": 0.008153846153846154,
1120
- "grad_norm": 0.25390625,
1121
- "learning_rate": 0.08153846153846155,
1122
- "loss": 3.2460896968841553,
1123
- "step": 318
1124
- },
1125
- {
1126
- "epoch": 0.008205128205128205,
1127
- "grad_norm": 0.2138671875,
1128
- "learning_rate": 0.08205128205128205,
1129
- "loss": 3.2442245483398438,
1130
- "step": 320
1131
- },
1132
- {
1133
- "epoch": 0.008256410256410256,
1134
- "grad_norm": 0.2138671875,
1135
- "learning_rate": 0.08256410256410257,
1136
- "loss": 3.226229667663574,
1137
- "step": 322
1138
- },
1139
- {
1140
- "epoch": 0.008307692307692308,
1141
- "grad_norm": 0.20703125,
1142
- "learning_rate": 0.08307692307692308,
1143
- "loss": 3.2243640422821045,
1144
- "step": 324
1145
- },
1146
- {
1147
- "epoch": 0.008358974358974359,
1148
- "grad_norm": 0.2001953125,
1149
- "learning_rate": 0.0835897435897436,
1150
- "loss": 3.196157693862915,
1151
- "step": 326
1152
- },
1153
- {
1154
- "epoch": 0.00841025641025641,
1155
- "grad_norm": 0.22265625,
1156
- "learning_rate": 0.08410256410256411,
1157
- "loss": 3.2026312351226807,
1158
- "step": 328
1159
- },
1160
- {
1161
- "epoch": 0.008461538461538461,
1162
- "grad_norm": 0.2236328125,
1163
- "learning_rate": 0.08461538461538462,
1164
- "loss": 3.2040438652038574,
1165
- "step": 330
1166
- },
1167
- {
1168
- "epoch": 0.008512820512820513,
1169
- "grad_norm": 0.228515625,
1170
- "learning_rate": 0.08512820512820514,
1171
- "loss": 3.2003910541534424,
1172
- "step": 332
1173
- },
1174
- {
1175
- "epoch": 0.008564102564102564,
1176
- "grad_norm": 0.1943359375,
1177
- "learning_rate": 0.08564102564102563,
1178
- "loss": 3.1665427684783936,
1179
- "step": 334
1180
- },
1181
- {
1182
- "epoch": 0.008615384615384615,
1183
- "grad_norm": 0.212890625,
1184
- "learning_rate": 0.08615384615384616,
1185
- "loss": 3.191206693649292,
1186
- "step": 336
1187
- },
1188
- {
1189
- "epoch": 0.008666666666666666,
1190
- "grad_norm": 0.220703125,
1191
- "learning_rate": 0.08666666666666668,
1192
- "loss": 3.2061381340026855,
1193
- "step": 338
1194
- },
1195
- {
1196
- "epoch": 0.008717948717948718,
1197
- "grad_norm": 0.2099609375,
1198
- "learning_rate": 0.08717948717948718,
1199
- "loss": 3.1825222969055176,
1200
- "step": 340
1201
- },
1202
- {
1203
- "epoch": 0.008769230769230769,
1204
- "grad_norm": 0.2255859375,
1205
- "learning_rate": 0.0876923076923077,
1206
- "loss": 3.17889666557312,
1207
- "step": 342
1208
- },
1209
- {
1210
- "epoch": 0.00882051282051282,
1211
- "grad_norm": 0.23828125,
1212
- "learning_rate": 0.0882051282051282,
1213
- "loss": 3.208892822265625,
1214
- "step": 344
1215
- },
1216
- {
1217
- "epoch": 0.008871794871794871,
1218
- "grad_norm": 0.1796875,
1219
- "learning_rate": 0.08871794871794872,
1220
- "loss": 3.174936056137085,
1221
- "step": 346
1222
- },
1223
- {
1224
- "epoch": 0.008923076923076922,
1225
- "grad_norm": 0.228515625,
1226
- "learning_rate": 0.08923076923076924,
1227
- "loss": 3.1907541751861572,
1228
- "step": 348
1229
- },
1230
- {
1231
- "epoch": 0.008974358974358974,
1232
- "grad_norm": 0.2578125,
1233
- "learning_rate": 0.08974358974358974,
1234
- "loss": 3.206651210784912,
1235
- "step": 350
1236
- },
1237
- {
1238
- "epoch": 0.009025641025641025,
1239
- "grad_norm": 0.2333984375,
1240
- "learning_rate": 0.09025641025641026,
1241
- "loss": 3.183749198913574,
1242
- "step": 352
1243
- },
1244
- {
1245
- "epoch": 0.009076923076923076,
1246
- "grad_norm": 0.1943359375,
1247
- "learning_rate": 0.09076923076923077,
1248
- "loss": 3.1806201934814453,
1249
- "step": 354
1250
- },
1251
- {
1252
- "epoch": 0.009128205128205127,
1253
- "grad_norm": 0.1982421875,
1254
- "learning_rate": 0.09128205128205129,
1255
- "loss": 3.1866257190704346,
1256
- "step": 356
1257
- },
1258
- {
1259
- "epoch": 0.009179487179487179,
1260
- "grad_norm": 0.2001953125,
1261
- "learning_rate": 0.09179487179487181,
1262
- "loss": 3.1684730052948,
1263
- "step": 358
1264
- },
1265
- {
1266
- "epoch": 0.009230769230769232,
1267
- "grad_norm": 0.220703125,
1268
- "learning_rate": 0.09230769230769231,
1269
- "loss": 3.1860649585723877,
1270
- "step": 360
1271
- },
1272
- {
1273
- "epoch": 0.009282051282051283,
1274
- "grad_norm": 0.1875,
1275
- "learning_rate": 0.09282051282051283,
1276
- "loss": 3.1316580772399902,
1277
- "step": 362
1278
- },
1279
- {
1280
- "epoch": 0.009333333333333334,
1281
- "grad_norm": 0.251953125,
1282
- "learning_rate": 0.09333333333333332,
1283
- "loss": 3.1661438941955566,
1284
- "step": 364
1285
- },
1286
- {
1287
- "epoch": 0.009384615384615385,
1288
- "grad_norm": 0.1943359375,
1289
- "learning_rate": 0.09384615384615384,
1290
- "loss": 3.165419340133667,
1291
- "step": 366
1292
- },
1293
- {
1294
- "epoch": 0.009435897435897437,
1295
- "grad_norm": 0.17578125,
1296
- "learning_rate": 0.09435897435897438,
1297
- "loss": 3.114865779876709,
1298
- "step": 368
1299
- },
1300
- {
1301
- "epoch": 0.009487179487179488,
1302
- "grad_norm": 0.166015625,
1303
- "learning_rate": 0.09487179487179487,
1304
- "loss": 3.1663386821746826,
1305
- "step": 370
1306
- },
1307
- {
1308
- "epoch": 0.009538461538461539,
1309
- "grad_norm": 0.2001953125,
1310
- "learning_rate": 0.09538461538461539,
1311
- "loss": 3.170686721801758,
1312
- "step": 372
1313
- },
1314
- {
1315
- "epoch": 0.00958974358974359,
1316
- "grad_norm": 0.1611328125,
1317
- "learning_rate": 0.09589743589743589,
1318
- "loss": 3.1436655521392822,
1319
- "step": 374
1320
- },
1321
- {
1322
- "epoch": 0.009641025641025642,
1323
- "grad_norm": 0.181640625,
1324
- "learning_rate": 0.09641025641025641,
1325
- "loss": 3.1797540187835693,
1326
- "step": 376
1327
- },
1328
- {
1329
- "epoch": 0.009692307692307693,
1330
- "grad_norm": 0.197265625,
1331
- "learning_rate": 0.09692307692307693,
1332
- "loss": 3.164923667907715,
1333
- "step": 378
1334
- },
1335
- {
1336
- "epoch": 0.009743589743589744,
1337
- "grad_norm": 0.2041015625,
1338
- "learning_rate": 0.09743589743589744,
1339
- "loss": 3.1701009273529053,
1340
- "step": 380
1341
- },
1342
- {
1343
- "epoch": 0.009794871794871795,
1344
- "grad_norm": 0.1513671875,
1345
- "learning_rate": 0.09794871794871796,
1346
- "loss": 3.1355717182159424,
1347
- "step": 382
1348
- },
1349
- {
1350
- "epoch": 0.009846153846153846,
1351
- "grad_norm": 0.1552734375,
1352
- "learning_rate": 0.09846153846153848,
1353
- "loss": 3.1020851135253906,
1354
- "step": 384
1355
- },
1356
- {
1357
- "epoch": 0.009897435897435898,
1358
- "grad_norm": 0.1689453125,
1359
- "learning_rate": 0.09897435897435898,
1360
- "loss": 3.146981954574585,
1361
- "step": 386
1362
- },
1363
- {
1364
- "epoch": 0.009948717948717949,
1365
- "grad_norm": 0.201171875,
1366
- "learning_rate": 0.0994871794871795,
1367
- "loss": 3.1239013671875,
1368
- "step": 388
1369
- },
1370
- {
1371
- "epoch": 0.01,
1372
- "grad_norm": 0.228515625,
1373
- "learning_rate": 0.1,
1374
- "loss": 3.0975100994110107,
1375
- "step": 390
1376
  }
1377
  ],
1378
  "logging_steps": 2,
1379
- "max_steps": 39000,
1380
  "num_input_tokens_seen": 0,
1381
  "num_train_epochs": 9223372036854775807,
1382
- "save_steps": 390,
1383
  "stateful_callbacks": {
1384
  "TrainerControl": {
1385
  "args": {
@@ -1392,7 +1126,7 @@
1392
  "attributes": {}
1393
  }
1394
  },
1395
- "total_flos": 9.851886071221248e+17,
1396
  "train_batch_size": 4,
1397
  "trial_name": null,
1398
  "trial_params": null
 
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
  "epoch": 0.01,
6
+ "eval_steps": 3150,
7
+ "global_step": 315,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
11
  "log_history": [
12
  {
13
+ "epoch": 6.349206349206349e-05,
14
+ "grad_norm": 6.625,
15
+ "learning_rate": 0.0006349206349206349,
16
+ "loss": 10.801105499267578,
17
  "step": 2
18
  },
19
  {
20
+ "epoch": 0.00012698412698412698,
21
+ "grad_norm": 7.09375,
22
+ "learning_rate": 0.0012698412698412698,
23
+ "loss": 9.326807975769043,
24
  "step": 4
25
  },
26
  {
27
+ "epoch": 0.00019047619047619048,
28
+ "grad_norm": 3.890625,
29
+ "learning_rate": 0.001904761904761905,
30
+ "loss": 7.773923397064209,
31
  "step": 6
32
  },
33
  {
34
+ "epoch": 0.00025396825396825396,
35
+ "grad_norm": 6.96875,
36
+ "learning_rate": 0.0025396825396825397,
37
+ "loss": 7.479777812957764,
38
  "step": 8
39
  },
40
  {
41
+ "epoch": 0.00031746031746031746,
42
+ "grad_norm": 5.96875,
43
+ "learning_rate": 0.0031746031746031746,
44
+ "loss": 7.3737945556640625,
45
  "step": 10
46
  },
47
  {
48
+ "epoch": 0.00038095238095238096,
49
+ "grad_norm": 3.390625,
50
+ "learning_rate": 0.00380952380952381,
51
+ "loss": 7.2390546798706055,
52
  "step": 12
53
  },
54
  {
55
+ "epoch": 0.00044444444444444447,
56
+ "grad_norm": 3.125,
57
+ "learning_rate": 0.0044444444444444444,
58
+ "loss": 7.201446533203125,
59
  "step": 14
60
  },
61
  {
62
+ "epoch": 0.0005079365079365079,
63
+ "grad_norm": 3.046875,
64
+ "learning_rate": 0.005079365079365079,
65
+ "loss": 7.195759296417236,
66
  "step": 16
67
  },
68
  {
69
+ "epoch": 0.0005714285714285715,
70
+ "grad_norm": 2.703125,
71
+ "learning_rate": 0.005714285714285714,
72
+ "loss": 7.20925760269165,
73
  "step": 18
74
  },
75
  {
76
+ "epoch": 0.0006349206349206349,
77
+ "grad_norm": 3.875,
78
+ "learning_rate": 0.006349206349206349,
79
+ "loss": 7.200610160827637,
80
  "step": 20
81
  },
82
  {
83
+ "epoch": 0.0006984126984126984,
84
+ "grad_norm": 3.53125,
85
+ "learning_rate": 0.006984126984126985,
86
+ "loss": 7.15569543838501,
87
  "step": 22
88
  },
89
  {
90
+ "epoch": 0.0007619047619047619,
91
+ "grad_norm": 3.53125,
92
+ "learning_rate": 0.00761904761904762,
93
+ "loss": 7.171877384185791,
94
  "step": 24
95
  },
96
  {
97
+ "epoch": 0.0008253968253968254,
98
+ "grad_norm": 3.546875,
99
+ "learning_rate": 0.008253968253968255,
100
+ "loss": 7.162521839141846,
101
  "step": 26
102
  },
103
  {
104
+ "epoch": 0.0008888888888888889,
105
+ "grad_norm": 4.0625,
106
+ "learning_rate": 0.008888888888888889,
107
+ "loss": 7.177415370941162,
108
  "step": 28
109
  },
110
  {
111
+ "epoch": 0.0009523809523809524,
112
+ "grad_norm": 3.375,
113
+ "learning_rate": 0.009523809523809525,
114
+ "loss": 7.142434120178223,
115
  "step": 30
116
  },
117
  {
118
+ "epoch": 0.0010158730158730158,
119
+ "grad_norm": 4.03125,
120
+ "learning_rate": 0.010158730158730159,
121
+ "loss": 7.162986755371094,
122
  "step": 32
123
  },
124
  {
125
+ "epoch": 0.0010793650793650793,
126
+ "grad_norm": 5.53125,
127
+ "learning_rate": 0.010793650793650795,
128
+ "loss": 7.125688552856445,
129
  "step": 34
130
  },
131
  {
132
+ "epoch": 0.001142857142857143,
133
+ "grad_norm": 3.90625,
134
+ "learning_rate": 0.011428571428571429,
135
+ "loss": 7.064617156982422,
136
  "step": 36
137
  },
138
  {
139
+ "epoch": 0.0012063492063492064,
140
+ "grad_norm": 4.0,
141
+ "learning_rate": 0.012063492063492064,
142
+ "loss": 7.0018086433410645,
143
  "step": 38
144
  },
145
  {
146
+ "epoch": 0.0012698412698412698,
147
+ "grad_norm": 4.78125,
148
+ "learning_rate": 0.012698412698412698,
149
+ "loss": 6.9951910972595215,
150
  "step": 40
151
  },
152
  {
153
+ "epoch": 0.0013333333333333333,
154
+ "grad_norm": 4.34375,
155
+ "learning_rate": 0.013333333333333334,
156
+ "loss": 6.8632588386535645,
157
  "step": 42
158
  },
159
  {
160
+ "epoch": 0.0013968253968253967,
161
+ "grad_norm": 4.5625,
162
+ "learning_rate": 0.01396825396825397,
163
+ "loss": 6.8031721115112305,
164
  "step": 44
165
  },
166
  {
167
+ "epoch": 0.0014603174603174604,
168
+ "grad_norm": 5.90625,
169
+ "learning_rate": 0.014603174603174604,
170
+ "loss": 6.659753322601318,
171
  "step": 46
172
  },
173
  {
174
+ "epoch": 0.0015238095238095239,
175
+ "grad_norm": 5.3125,
176
+ "learning_rate": 0.01523809523809524,
177
+ "loss": 6.541396141052246,
178
  "step": 48
179
  },
180
  {
181
+ "epoch": 0.0015873015873015873,
182
+ "grad_norm": 7.375,
183
+ "learning_rate": 0.015873015873015872,
184
+ "loss": 6.320700645446777,
185
  "step": 50
186
  },
187
  {
188
+ "epoch": 0.0016507936507936507,
189
+ "grad_norm": 7.03125,
190
+ "learning_rate": 0.01650793650793651,
191
+ "loss": 6.180545806884766,
192
  "step": 52
193
  },
194
  {
195
+ "epoch": 0.0017142857142857142,
196
+ "grad_norm": 9.5,
197
+ "learning_rate": 0.017142857142857144,
198
+ "loss": 6.006712436676025,
199
  "step": 54
200
  },
201
  {
202
+ "epoch": 0.0017777777777777779,
203
+ "grad_norm": 5.5625,
204
+ "learning_rate": 0.017777777777777778,
205
+ "loss": 5.814790725708008,
206
  "step": 56
207
  },
208
  {
209
+ "epoch": 0.0018412698412698413,
210
+ "grad_norm": 7.71875,
211
+ "learning_rate": 0.018412698412698415,
212
+ "loss": 5.85807991027832,
213
  "step": 58
214
  },
215
  {
216
+ "epoch": 0.0019047619047619048,
217
+ "grad_norm": 11.0,
218
+ "learning_rate": 0.01904761904761905,
219
+ "loss": 5.783743858337402,
220
  "step": 60
221
  },
222
  {
223
+ "epoch": 0.0019682539682539684,
224
+ "grad_norm": 6.21875,
225
+ "learning_rate": 0.019682539682539683,
226
+ "loss": 5.803546905517578,
227
  "step": 62
228
  },
229
  {
230
+ "epoch": 0.0020317460317460317,
231
+ "grad_norm": 9.875,
232
+ "learning_rate": 0.020317460317460317,
233
+ "loss": 5.761871337890625,
234
  "step": 64
235
  },
236
  {
237
+ "epoch": 0.0020952380952380953,
238
+ "grad_norm": 9.0,
239
+ "learning_rate": 0.020952380952380955,
240
+ "loss": 5.712563991546631,
241
  "step": 66
242
  },
243
  {
244
+ "epoch": 0.0021587301587301586,
245
+ "grad_norm": 8.5,
246
+ "learning_rate": 0.02158730158730159,
247
+ "loss": 5.822197914123535,
248
  "step": 68
249
  },
250
  {
251
+ "epoch": 0.0022222222222222222,
252
+ "grad_norm": 5.3125,
253
+ "learning_rate": 0.022222222222222223,
254
+ "loss": 5.670584678649902,
255
  "step": 70
256
  },
257
  {
258
+ "epoch": 0.002285714285714286,
259
+ "grad_norm": 6.90625,
260
+ "learning_rate": 0.022857142857142857,
261
+ "loss": 5.861469745635986,
262
  "step": 72
263
  },
264
  {
265
+ "epoch": 0.002349206349206349,
266
+ "grad_norm": 7.90625,
267
+ "learning_rate": 0.023492063492063495,
268
+ "loss": 5.852883815765381,
269
  "step": 74
270
  },
271
  {
272
+ "epoch": 0.0024126984126984128,
273
+ "grad_norm": 8.25,
274
+ "learning_rate": 0.02412698412698413,
275
+ "loss": 6.089724540710449,
276
  "step": 76
277
  },
278
  {
279
+ "epoch": 0.002476190476190476,
280
+ "grad_norm": 11.75,
281
+ "learning_rate": 0.024761904761904763,
282
+ "loss": 5.999917030334473,
283
  "step": 78
284
  },
285
  {
286
+ "epoch": 0.0025396825396825397,
287
+ "grad_norm": 11.4375,
288
+ "learning_rate": 0.025396825396825397,
289
+ "loss": 6.174747467041016,
290
  "step": 80
291
  },
292
  {
293
+ "epoch": 0.0026031746031746033,
294
+ "grad_norm": 8.3125,
295
+ "learning_rate": 0.026031746031746034,
296
+ "loss": 6.123311519622803,
297
  "step": 82
298
  },
299
  {
300
+ "epoch": 0.0026666666666666666,
301
+ "grad_norm": 12.1875,
302
+ "learning_rate": 0.02666666666666667,
303
+ "loss": 6.0668158531188965,
304
  "step": 84
305
  },
306
  {
307
+ "epoch": 0.0027301587301587302,
308
+ "grad_norm": 6.75,
309
+ "learning_rate": 0.0273015873015873,
310
+ "loss": 6.131885051727295,
311
  "step": 86
312
  },
313
  {
314
+ "epoch": 0.0027936507936507935,
315
+ "grad_norm": 6.65625,
316
+ "learning_rate": 0.02793650793650794,
317
+ "loss": 6.160358428955078,
318
  "step": 88
319
  },
320
  {
321
+ "epoch": 0.002857142857142857,
322
+ "grad_norm": 9.3125,
323
+ "learning_rate": 0.02857142857142857,
324
+ "loss": 6.3066277503967285,
325
  "step": 90
326
  },
327
  {
328
+ "epoch": 0.002920634920634921,
329
+ "grad_norm": 5.4375,
330
+ "learning_rate": 0.029206349206349208,
331
+ "loss": 6.316789627075195,
332
  "step": 92
333
  },
334
  {
335
+ "epoch": 0.002984126984126984,
336
+ "grad_norm": 6.59375,
337
+ "learning_rate": 0.029841269841269842,
338
+ "loss": 6.33724308013916,
339
  "step": 94
340
  },
341
  {
342
+ "epoch": 0.0030476190476190477,
343
+ "grad_norm": 6.5,
344
+ "learning_rate": 0.03047619047619048,
345
+ "loss": 6.288860321044922,
346
  "step": 96
347
  },
348
  {
349
+ "epoch": 0.003111111111111111,
350
+ "grad_norm": 8.6875,
351
+ "learning_rate": 0.031111111111111114,
352
+ "loss": 6.362759113311768,
353
  "step": 98
354
  },
355
  {
356
+ "epoch": 0.0031746031746031746,
357
+ "grad_norm": 5.1875,
358
+ "learning_rate": 0.031746031746031744,
359
+ "loss": 6.259101390838623,
360
  "step": 100
361
  },
362
  {
363
+ "epoch": 0.0032380952380952383,
364
+ "grad_norm": 4.0,
365
+ "learning_rate": 0.032380952380952385,
366
+ "loss": 6.47907829284668,
367
  "step": 102
368
  },
369
  {
370
+ "epoch": 0.0033015873015873015,
371
+ "grad_norm": 5.28125,
372
+ "learning_rate": 0.03301587301587302,
373
+ "loss": 6.57755184173584,
374
  "step": 104
375
  },
376
  {
377
+ "epoch": 0.003365079365079365,
378
+ "grad_norm": 5.59375,
379
+ "learning_rate": 0.03365079365079365,
380
+ "loss": 6.404579162597656,
381
  "step": 106
382
  },
383
  {
384
+ "epoch": 0.0034285714285714284,
385
+ "grad_norm": 5.40625,
386
+ "learning_rate": 0.03428571428571429,
387
+ "loss": 6.36335563659668,
388
  "step": 108
389
  },
390
  {
391
+ "epoch": 0.003492063492063492,
392
+ "grad_norm": 5.8125,
393
+ "learning_rate": 0.03492063492063492,
394
+ "loss": 6.326794147491455,
395
  "step": 110
396
  },
397
  {
398
+ "epoch": 0.0035555555555555557,
399
+ "grad_norm": 5.34375,
400
+ "learning_rate": 0.035555555555555556,
401
+ "loss": 6.243236541748047,
402
  "step": 112
403
  },
404
  {
405
+ "epoch": 0.003619047619047619,
406
+ "grad_norm": 4.71875,
407
+ "learning_rate": 0.03619047619047619,
408
+ "loss": 6.32989501953125,
409
  "step": 114
410
  },
411
  {
412
+ "epoch": 0.0036825396825396826,
413
+ "grad_norm": 5.21875,
414
+ "learning_rate": 0.03682539682539683,
415
+ "loss": 6.213305950164795,
416
  "step": 116
417
  },
418
  {
419
+ "epoch": 0.003746031746031746,
420
+ "grad_norm": 4.6875,
421
+ "learning_rate": 0.037460317460317465,
422
+ "loss": 6.210652828216553,
423
  "step": 118
424
  },
425
  {
426
+ "epoch": 0.0038095238095238095,
427
+ "grad_norm": 3.890625,
428
+ "learning_rate": 0.0380952380952381,
429
+ "loss": 5.987586975097656,
430
  "step": 120
431
  },
432
  {
433
+ "epoch": 0.003873015873015873,
434
+ "grad_norm": 4.1875,
435
+ "learning_rate": 0.03873015873015873,
436
+ "loss": 5.850035190582275,
437
  "step": 122
438
  },
439
  {
440
+ "epoch": 0.003936507936507937,
441
+ "grad_norm": 3.609375,
442
+ "learning_rate": 0.03936507936507937,
443
+ "loss": 5.705539703369141,
444
  "step": 124
445
  },
446
  {
447
+ "epoch": 0.004,
448
+ "grad_norm": 3.984375,
449
+ "learning_rate": 0.04000000000000001,
450
+ "loss": 5.706523418426514,
451
  "step": 126
452
  },
453
  {
454
+ "epoch": 0.004063492063492063,
455
+ "grad_norm": 4.15625,
456
+ "learning_rate": 0.040634920634920635,
457
+ "loss": 5.558238983154297,
458
  "step": 128
459
  },
460
  {
461
+ "epoch": 0.004126984126984127,
462
+ "grad_norm": 3.96875,
463
+ "learning_rate": 0.04126984126984127,
464
+ "loss": 5.4358367919921875,
465
  "step": 130
466
  },
467
  {
468
+ "epoch": 0.004190476190476191,
469
+ "grad_norm": 3.015625,
470
+ "learning_rate": 0.04190476190476191,
471
+ "loss": 5.235808372497559,
472
  "step": 132
473
  },
474
  {
475
+ "epoch": 0.004253968253968254,
476
+ "grad_norm": 3.40625,
477
+ "learning_rate": 0.042539682539682544,
478
+ "loss": 5.232395172119141,
479
  "step": 134
480
  },
481
  {
482
+ "epoch": 0.004317460317460317,
483
+ "grad_norm": 3.78125,
484
+ "learning_rate": 0.04317460317460318,
485
+ "loss": 5.167571067810059,
486
  "step": 136
487
  },
488
  {
489
+ "epoch": 0.004380952380952381,
490
+ "grad_norm": 6.21875,
491
+ "learning_rate": 0.04380952380952381,
492
+ "loss": 5.139188289642334,
493
  "step": 138
494
  },
495
  {
496
+ "epoch": 0.0044444444444444444,
497
+ "grad_norm": 4.28125,
498
+ "learning_rate": 0.044444444444444446,
499
+ "loss": 5.103665351867676,
500
  "step": 140
501
  },
502
  {
503
+ "epoch": 0.004507936507936508,
504
+ "grad_norm": 2.9375,
505
+ "learning_rate": 0.04507936507936508,
506
+ "loss": 5.074988842010498,
507
  "step": 142
508
  },
509
  {
510
+ "epoch": 0.004571428571428572,
511
+ "grad_norm": 2.59375,
512
+ "learning_rate": 0.045714285714285714,
513
+ "loss": 4.910512924194336,
514
  "step": 144
515
  },
516
  {
517
+ "epoch": 0.004634920634920635,
518
+ "grad_norm": 2.96875,
519
+ "learning_rate": 0.046349206349206355,
520
+ "loss": 4.994100093841553,
521
  "step": 146
522
  },
523
  {
524
+ "epoch": 0.004698412698412698,
525
+ "grad_norm": 2.71875,
526
+ "learning_rate": 0.04698412698412699,
527
+ "loss": 4.926704406738281,
528
  "step": 148
529
  },
530
  {
531
+ "epoch": 0.004761904761904762,
532
+ "grad_norm": 2.90625,
533
+ "learning_rate": 0.047619047619047616,
534
+ "loss": 4.945565223693848,
535
  "step": 150
536
  },
537
  {
538
+ "epoch": 0.0048253968253968256,
539
+ "grad_norm": 3.140625,
540
+ "learning_rate": 0.04825396825396826,
541
+ "loss": 4.820583343505859,
542
  "step": 152
543
  },
544
  {
545
+ "epoch": 0.004888888888888889,
546
+ "grad_norm": 2.375,
547
+ "learning_rate": 0.04888888888888889,
548
+ "loss": 4.817602634429932,
549
  "step": 154
550
  },
551
  {
552
+ "epoch": 0.004952380952380952,
553
+ "grad_norm": 2.890625,
554
+ "learning_rate": 0.049523809523809526,
555
+ "loss": 4.858508110046387,
556
  "step": 156
557
  },
558
  {
559
+ "epoch": 0.005015873015873016,
560
+ "grad_norm": 3.09375,
561
+ "learning_rate": 0.05015873015873016,
562
+ "loss": 4.83630895614624,
563
  "step": 158
564
  },
565
  {
566
+ "epoch": 0.005079365079365079,
567
+ "grad_norm": 3.171875,
568
+ "learning_rate": 0.050793650793650794,
569
+ "loss": 4.845445156097412,
570
  "step": 160
571
  },
572
  {
573
+ "epoch": 0.005142857142857143,
574
+ "grad_norm": 2.671875,
575
+ "learning_rate": 0.05142857142857143,
576
+ "loss": 4.703234672546387,
577
  "step": 162
578
  },
579
  {
580
+ "epoch": 0.005206349206349207,
581
+ "grad_norm": 2.21875,
582
+ "learning_rate": 0.05206349206349207,
583
+ "loss": 4.716393947601318,
584
  "step": 164
585
  },
586
  {
587
+ "epoch": 0.00526984126984127,
588
+ "grad_norm": 1.9921875,
589
+ "learning_rate": 0.0526984126984127,
590
+ "loss": 4.729320049285889,
591
  "step": 166
592
  },
593
  {
594
+ "epoch": 0.005333333333333333,
595
+ "grad_norm": 2.296875,
596
+ "learning_rate": 0.05333333333333334,
597
+ "loss": 4.728988170623779,
598
  "step": 168
599
  },
600
  {
601
+ "epoch": 0.005396825396825397,
602
+ "grad_norm": 2.015625,
603
+ "learning_rate": 0.05396825396825397,
604
+ "loss": 4.712806701660156,
605
  "step": 170
606
  },
607
  {
608
+ "epoch": 0.0054603174603174605,
609
+ "grad_norm": 2.1875,
610
+ "learning_rate": 0.0546031746031746,
611
+ "loss": 4.607054710388184,
612
  "step": 172
613
  },
614
  {
615
+ "epoch": 0.005523809523809524,
616
+ "grad_norm": 1.90625,
617
+ "learning_rate": 0.055238095238095246,
618
+ "loss": 4.64877462387085,
619
  "step": 174
620
  },
621
  {
622
+ "epoch": 0.005587301587301587,
623
+ "grad_norm": 1.8515625,
624
+ "learning_rate": 0.05587301587301588,
625
+ "loss": 4.659054279327393,
626
  "step": 176
627
  },
628
  {
629
+ "epoch": 0.005650793650793651,
630
+ "grad_norm": 2.046875,
631
+ "learning_rate": 0.05650793650793651,
632
+ "loss": 4.607472896575928,
633
  "step": 178
634
  },
635
  {
636
+ "epoch": 0.005714285714285714,
637
+ "grad_norm": 3.015625,
638
+ "learning_rate": 0.05714285714285714,
639
+ "loss": 4.644662380218506,
640
  "step": 180
641
  },
642
  {
643
+ "epoch": 0.0057777777777777775,
644
+ "grad_norm": 2.125,
645
+ "learning_rate": 0.057777777777777775,
646
+ "loss": 4.561500549316406,
647
  "step": 182
648
  },
649
  {
650
+ "epoch": 0.005841269841269842,
651
+ "grad_norm": 1.9296875,
652
+ "learning_rate": 0.058412698412698416,
653
+ "loss": 4.61305570602417,
654
  "step": 184
655
  },
656
  {
657
+ "epoch": 0.005904761904761905,
658
+ "grad_norm": 2.0,
659
+ "learning_rate": 0.05904761904761905,
660
+ "loss": 4.505429744720459,
661
  "step": 186
662
  },
663
  {
664
+ "epoch": 0.005968253968253968,
665
+ "grad_norm": 1.796875,
666
+ "learning_rate": 0.059682539682539684,
667
+ "loss": 4.505371570587158,
668
  "step": 188
669
  },
670
  {
671
+ "epoch": 0.006031746031746032,
672
+ "grad_norm": 1.5859375,
673
+ "learning_rate": 0.06031746031746032,
674
+ "loss": 4.484126091003418,
675
  "step": 190
676
  },
677
  {
678
+ "epoch": 0.006095238095238095,
679
+ "grad_norm": 1.796875,
680
+ "learning_rate": 0.06095238095238096,
681
+ "loss": 4.488917350769043,
682
  "step": 192
683
  },
684
  {
685
+ "epoch": 0.006158730158730159,
686
+ "grad_norm": 2.0625,
687
+ "learning_rate": 0.06158730158730159,
688
+ "loss": 4.548356533050537,
689
  "step": 194
690
  },
691
  {
692
+ "epoch": 0.006222222222222222,
693
+ "grad_norm": 1.7578125,
694
+ "learning_rate": 0.06222222222222223,
695
+ "loss": 4.44257926940918,
696
  "step": 196
697
  },
698
  {
699
+ "epoch": 0.006285714285714286,
700
+ "grad_norm": 1.7890625,
701
+ "learning_rate": 0.06285714285714286,
702
+ "loss": 4.4452056884765625,
703
  "step": 198
704
  },
705
  {
706
+ "epoch": 0.006349206349206349,
707
+ "grad_norm": 1.8515625,
708
+ "learning_rate": 0.06349206349206349,
709
+ "loss": 4.5187506675720215,
710
  "step": 200
711
  },
712
  {
713
+ "epoch": 0.006412698412698412,
714
+ "grad_norm": 1.7265625,
715
+ "learning_rate": 0.06412698412698413,
716
+ "loss": 4.399511814117432,
717
  "step": 202
718
  },
719
  {
720
+ "epoch": 0.0064761904761904765,
721
+ "grad_norm": 1.703125,
722
+ "learning_rate": 0.06476190476190477,
723
+ "loss": 4.358022212982178,
724
  "step": 204
725
  },
726
  {
727
+ "epoch": 0.00653968253968254,
728
+ "grad_norm": 1.671875,
729
+ "learning_rate": 0.0653968253968254,
730
+ "loss": 4.394007205963135,
731
  "step": 206
732
  },
733
  {
734
+ "epoch": 0.006603174603174603,
735
+ "grad_norm": 1.59375,
736
+ "learning_rate": 0.06603174603174604,
737
+ "loss": 4.378864765167236,
738
  "step": 208
739
  },
740
  {
741
+ "epoch": 0.006666666666666667,
742
+ "grad_norm": 1.578125,
743
+ "learning_rate": 0.06666666666666667,
744
+ "loss": 4.373222827911377,
745
  "step": 210
746
  },
747
  {
748
+ "epoch": 0.00673015873015873,
749
+ "grad_norm": 1.390625,
750
+ "learning_rate": 0.0673015873015873,
751
+ "loss": 4.297969341278076,
752
  "step": 212
753
  },
754
  {
755
+ "epoch": 0.0067936507936507936,
756
+ "grad_norm": 1.578125,
757
+ "learning_rate": 0.06793650793650795,
758
+ "loss": 4.358753204345703,
759
  "step": 214
760
  },
761
  {
762
+ "epoch": 0.006857142857142857,
763
+ "grad_norm": 2.125,
764
+ "learning_rate": 0.06857142857142857,
765
+ "loss": 4.382944107055664,
766
  "step": 216
767
  },
768
  {
769
+ "epoch": 0.006920634920634921,
770
+ "grad_norm": 1.7421875,
771
+ "learning_rate": 0.0692063492063492,
772
+ "loss": 4.358743667602539,
773
  "step": 218
774
  },
775
  {
776
+ "epoch": 0.006984126984126984,
777
+ "grad_norm": 1.9375,
778
+ "learning_rate": 0.06984126984126984,
779
+ "loss": 4.28198766708374,
780
  "step": 220
781
  },
782
  {
783
+ "epoch": 0.007047619047619047,
784
+ "grad_norm": 1.90625,
785
+ "learning_rate": 0.07047619047619048,
786
+ "loss": 4.325778007507324,
787
  "step": 222
788
  },
789
  {
790
+ "epoch": 0.0071111111111111115,
791
+ "grad_norm": 1.5703125,
792
+ "learning_rate": 0.07111111111111111,
793
+ "loss": 4.283350467681885,
794
  "step": 224
795
  },
796
  {
797
+ "epoch": 0.007174603174603175,
798
+ "grad_norm": 1.875,
799
+ "learning_rate": 0.07174603174603175,
800
+ "loss": 4.292675971984863,
801
  "step": 226
802
  },
803
  {
804
+ "epoch": 0.007238095238095238,
805
+ "grad_norm": 1.5078125,
806
+ "learning_rate": 0.07238095238095238,
807
+ "loss": 4.210683345794678,
808
  "step": 228
809
  },
810
  {
811
+ "epoch": 0.007301587301587302,
812
+ "grad_norm": 1.4296875,
813
+ "learning_rate": 0.07301587301587302,
814
+ "loss": 4.2952704429626465,
815
  "step": 230
816
  },
817
  {
818
+ "epoch": 0.007365079365079365,
819
+ "grad_norm": 1.75,
820
+ "learning_rate": 0.07365079365079366,
821
+ "loss": 4.2953972816467285,
822
  "step": 232
823
  },
824
  {
825
+ "epoch": 0.0074285714285714285,
826
+ "grad_norm": 1.6484375,
827
+ "learning_rate": 0.07428571428571429,
828
+ "loss": 4.21522331237793,
829
  "step": 234
830
  },
831
  {
832
+ "epoch": 0.007492063492063492,
833
+ "grad_norm": 1.5703125,
834
+ "learning_rate": 0.07492063492063493,
835
+ "loss": 4.231412410736084,
836
  "step": 236
837
  },
838
  {
839
+ "epoch": 0.007555555555555556,
840
+ "grad_norm": 1.6484375,
841
+ "learning_rate": 0.07555555555555556,
842
+ "loss": 4.215019226074219,
843
  "step": 238
844
  },
845
  {
846
+ "epoch": 0.007619047619047619,
847
+ "grad_norm": 1.703125,
848
+ "learning_rate": 0.0761904761904762,
849
+ "loss": 4.229800701141357,
850
  "step": 240
851
  },
852
  {
853
+ "epoch": 0.007682539682539682,
854
+ "grad_norm": 1.2109375,
855
+ "learning_rate": 0.07682539682539684,
856
+ "loss": 4.152937412261963,
857
  "step": 242
858
  },
859
  {
860
+ "epoch": 0.007746031746031746,
861
+ "grad_norm": 1.3203125,
862
+ "learning_rate": 0.07746031746031747,
863
+ "loss": 4.1424665451049805,
864
  "step": 244
865
  },
866
  {
867
+ "epoch": 0.00780952380952381,
868
+ "grad_norm": 1.5234375,
869
+ "learning_rate": 0.0780952380952381,
870
+ "loss": 4.163131237030029,
871
  "step": 246
872
  },
873
  {
874
+ "epoch": 0.007873015873015874,
875
+ "grad_norm": 1.5078125,
876
+ "learning_rate": 0.07873015873015873,
877
+ "loss": 4.1024556159973145,
878
  "step": 248
879
  },
880
  {
881
+ "epoch": 0.007936507936507936,
882
+ "grad_norm": 1.2734375,
883
+ "learning_rate": 0.07936507936507936,
884
+ "loss": 4.060139179229736,
885
  "step": 250
886
  },
887
  {
888
+ "epoch": 0.008,
889
+ "grad_norm": 1.265625,
890
+ "learning_rate": 0.08000000000000002,
891
+ "loss": 4.058903217315674,
892
  "step": 252
893
  },
894
  {
895
+ "epoch": 0.008063492063492064,
896
+ "grad_norm": 1.2421875,
897
+ "learning_rate": 0.08063492063492064,
898
+ "loss": 4.025557994842529,
899
  "step": 254
900
  },
901
  {
902
+ "epoch": 0.008126984126984127,
903
+ "grad_norm": 1.375,
904
+ "learning_rate": 0.08126984126984127,
905
+ "loss": 3.9608795642852783,
906
  "step": 256
907
  },
908
  {
909
+ "epoch": 0.00819047619047619,
910
+ "grad_norm": 1.6875,
911
+ "learning_rate": 0.08190476190476191,
912
+ "loss": 3.9889020919799805,
913
  "step": 258
914
  },
915
  {
916
+ "epoch": 0.008253968253968255,
917
+ "grad_norm": 1.6171875,
918
+ "learning_rate": 0.08253968253968254,
919
+ "loss": 3.962678909301758,
920
  "step": 260
921
  },
922
  {
923
+ "epoch": 0.008317460317460317,
924
+ "grad_norm": 1.4375,
925
+ "learning_rate": 0.08317460317460318,
926
+ "loss": 3.89566707611084,
927
  "step": 262
928
  },
929
  {
930
+ "epoch": 0.008380952380952381,
931
+ "grad_norm": 1.3203125,
932
+ "learning_rate": 0.08380952380952382,
933
+ "loss": 3.938316583633423,
934
  "step": 264
935
  },
936
  {
937
+ "epoch": 0.008444444444444444,
938
+ "grad_norm": 1.0859375,
939
+ "learning_rate": 0.08444444444444445,
940
+ "loss": 3.9036355018615723,
941
  "step": 266
942
  },
943
  {
944
+ "epoch": 0.008507936507936508,
945
+ "grad_norm": 1.4609375,
946
+ "learning_rate": 0.08507936507936509,
947
+ "loss": 3.845884084701538,
948
  "step": 268
949
  },
950
  {
951
+ "epoch": 0.008571428571428572,
952
+ "grad_norm": 1.078125,
953
+ "learning_rate": 0.08571428571428572,
954
+ "loss": 3.865518569946289,
955
  "step": 270
956
  },
957
  {
958
+ "epoch": 0.008634920634920634,
959
+ "grad_norm": 1.265625,
960
+ "learning_rate": 0.08634920634920636,
961
+ "loss": 3.879326105117798,
962
  "step": 272
963
  },
964
  {
965
+ "epoch": 0.008698412698412698,
966
+ "grad_norm": 1.4140625,
967
+ "learning_rate": 0.086984126984127,
968
+ "loss": 3.819279193878174,
969
  "step": 274
970
  },
971
  {
972
+ "epoch": 0.008761904761904762,
973
+ "grad_norm": 1.7734375,
974
+ "learning_rate": 0.08761904761904762,
975
+ "loss": 3.8500442504882812,
976
  "step": 276
977
  },
978
  {
979
+ "epoch": 0.008825396825396825,
980
+ "grad_norm": 1.6484375,
981
+ "learning_rate": 0.08825396825396825,
982
+ "loss": 3.7705399990081787,
983
  "step": 278
984
  },
985
  {
986
+ "epoch": 0.008888888888888889,
987
+ "grad_norm": 1.125,
988
+ "learning_rate": 0.08888888888888889,
989
+ "loss": 3.777470111846924,
990
  "step": 280
991
  },
992
  {
993
+ "epoch": 0.008952380952380953,
994
+ "grad_norm": 1.03125,
995
+ "learning_rate": 0.08952380952380953,
996
+ "loss": 3.7298450469970703,
997
  "step": 282
998
  },
999
  {
1000
+ "epoch": 0.009015873015873015,
1001
+ "grad_norm": 1.046875,
1002
+ "learning_rate": 0.09015873015873016,
1003
+ "loss": 3.794740915298462,
1004
  "step": 284
1005
  },
1006
  {
1007
+ "epoch": 0.00907936507936508,
1008
+ "grad_norm": 0.97265625,
1009
+ "learning_rate": 0.0907936507936508,
1010
+ "loss": 3.737441062927246,
1011
  "step": 286
1012
  },
1013
  {
1014
+ "epoch": 0.009142857142857144,
1015
+ "grad_norm": 1.1640625,
1016
+ "learning_rate": 0.09142857142857143,
1017
+ "loss": 3.7325448989868164,
1018
  "step": 288
1019
  },
1020
  {
1021
+ "epoch": 0.009206349206349206,
1022
+ "grad_norm": 1.265625,
1023
+ "learning_rate": 0.09206349206349207,
1024
+ "loss": 3.7607827186584473,
1025
  "step": 290
1026
  },
1027
  {
1028
+ "epoch": 0.00926984126984127,
1029
+ "grad_norm": 1.0546875,
1030
+ "learning_rate": 0.09269841269841271,
1031
+ "loss": 3.6826963424682617,
1032
  "step": 292
1033
  },
1034
  {
1035
+ "epoch": 0.009333333333333334,
1036
+ "grad_norm": 1.3515625,
1037
+ "learning_rate": 0.09333333333333334,
1038
+ "loss": 3.7264299392700195,
1039
  "step": 294
1040
  },
1041
  {
1042
+ "epoch": 0.009396825396825396,
1043
+ "grad_norm": 0.9765625,
1044
+ "learning_rate": 0.09396825396825398,
1045
+ "loss": 3.7098519802093506,
1046
  "step": 296
1047
  },
1048
  {
1049
+ "epoch": 0.00946031746031746,
1050
+ "grad_norm": 0.90234375,
1051
+ "learning_rate": 0.0946031746031746,
1052
+ "loss": 3.676978826522827,
1053
  "step": 298
1054
  },
1055
  {
1056
+ "epoch": 0.009523809523809525,
1057
+ "grad_norm": 0.81640625,
1058
+ "learning_rate": 0.09523809523809523,
1059
+ "loss": 3.687487840652466,
1060
  "step": 300
1061
  },
1062
  {
1063
+ "epoch": 0.009587301587301587,
1064
+ "grad_norm": 1.1484375,
1065
+ "learning_rate": 0.09587301587301589,
1066
+ "loss": 3.673914670944214,
1067
  "step": 302
1068
  },
1069
  {
1070
+ "epoch": 0.009650793650793651,
1071
+ "grad_norm": 1.0625,
1072
+ "learning_rate": 0.09650793650793651,
1073
+ "loss": 3.670208215713501,
1074
  "step": 304
1075
  },
1076
  {
1077
+ "epoch": 0.009714285714285713,
1078
+ "grad_norm": 1.0859375,
1079
+ "learning_rate": 0.09714285714285714,
1080
+ "loss": 3.633423328399658,
1081
  "step": 306
1082
  },
1083
  {
1084
+ "epoch": 0.009777777777777778,
1085
+ "grad_norm": 0.73046875,
1086
+ "learning_rate": 0.09777777777777778,
1087
+ "loss": 3.66752552986145,
1088
  "step": 308
1089
  },
1090
  {
1091
+ "epoch": 0.009841269841269842,
1092
+ "grad_norm": 0.7578125,
1093
+ "learning_rate": 0.09841269841269841,
1094
+ "loss": 3.6017661094665527,
1095
  "step": 310
1096
  },
1097
  {
1098
+ "epoch": 0.009904761904761904,
1099
+ "grad_norm": 0.80078125,
1100
+ "learning_rate": 0.09904761904761905,
1101
+ "loss": 3.6119208335876465,
1102
  "step": 312
1103
  },
1104
  {
1105
+ "epoch": 0.009968253968253968,
1106
+ "grad_norm": 1.359375,
1107
+ "learning_rate": 0.09968253968253969,
1108
+ "loss": 3.6598455905914307,
1109
  "step": 314
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1110
  }
1111
  ],
1112
  "logging_steps": 2,
1113
+ "max_steps": 31500,
1114
  "num_input_tokens_seen": 0,
1115
  "num_train_epochs": 9223372036854775807,
1116
+ "save_steps": 315,
1117
  "stateful_callbacks": {
1118
  "TrainerControl": {
1119
  "args": {
 
1126
  "attributes": {}
1127
  }
1128
  },
1129
+ "total_flos": 1.038138850746611e+18,
1130
  "train_batch_size": 4,
1131
  "trial_name": null,
1132
  "trial_params": null