Text Generation
Transformers
PyTorch
English
hed
howey commited on
Commit
50391a5
·
verified ·
1 Parent(s): 35f998f

Upload 9 files

Browse files

HDT encoder decoder for generation tasks

added_tokens.json ADDED
@@ -0,0 +1,509 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "<NLG>": 50269,
3
+ "<NLU>": 50268,
4
+ "<S2S>": 50270,
5
+ "<cls>": 50265,
6
+ "<doc>": 50266,
7
+ "<extra_id_0>": 50771,
8
+ "<extra_id_100>": 50671,
9
+ "<extra_id_101>": 50670,
10
+ "<extra_id_102>": 50669,
11
+ "<extra_id_103>": 50668,
12
+ "<extra_id_104>": 50667,
13
+ "<extra_id_105>": 50666,
14
+ "<extra_id_106>": 50665,
15
+ "<extra_id_107>": 50664,
16
+ "<extra_id_108>": 50663,
17
+ "<extra_id_109>": 50662,
18
+ "<extra_id_10>": 50761,
19
+ "<extra_id_110>": 50661,
20
+ "<extra_id_111>": 50660,
21
+ "<extra_id_112>": 50659,
22
+ "<extra_id_113>": 50658,
23
+ "<extra_id_114>": 50657,
24
+ "<extra_id_115>": 50656,
25
+ "<extra_id_116>": 50655,
26
+ "<extra_id_117>": 50654,
27
+ "<extra_id_118>": 50653,
28
+ "<extra_id_119>": 50652,
29
+ "<extra_id_11>": 50760,
30
+ "<extra_id_120>": 50651,
31
+ "<extra_id_121>": 50650,
32
+ "<extra_id_122>": 50649,
33
+ "<extra_id_123>": 50648,
34
+ "<extra_id_124>": 50647,
35
+ "<extra_id_125>": 50646,
36
+ "<extra_id_126>": 50645,
37
+ "<extra_id_127>": 50644,
38
+ "<extra_id_128>": 50643,
39
+ "<extra_id_129>": 50642,
40
+ "<extra_id_12>": 50759,
41
+ "<extra_id_130>": 50641,
42
+ "<extra_id_131>": 50640,
43
+ "<extra_id_132>": 50639,
44
+ "<extra_id_133>": 50638,
45
+ "<extra_id_134>": 50637,
46
+ "<extra_id_135>": 50636,
47
+ "<extra_id_136>": 50635,
48
+ "<extra_id_137>": 50634,
49
+ "<extra_id_138>": 50633,
50
+ "<extra_id_139>": 50632,
51
+ "<extra_id_13>": 50758,
52
+ "<extra_id_140>": 50631,
53
+ "<extra_id_141>": 50630,
54
+ "<extra_id_142>": 50629,
55
+ "<extra_id_143>": 50628,
56
+ "<extra_id_144>": 50627,
57
+ "<extra_id_145>": 50626,
58
+ "<extra_id_146>": 50625,
59
+ "<extra_id_147>": 50624,
60
+ "<extra_id_148>": 50623,
61
+ "<extra_id_149>": 50622,
62
+ "<extra_id_14>": 50757,
63
+ "<extra_id_150>": 50621,
64
+ "<extra_id_151>": 50620,
65
+ "<extra_id_152>": 50619,
66
+ "<extra_id_153>": 50618,
67
+ "<extra_id_154>": 50617,
68
+ "<extra_id_155>": 50616,
69
+ "<extra_id_156>": 50615,
70
+ "<extra_id_157>": 50614,
71
+ "<extra_id_158>": 50613,
72
+ "<extra_id_159>": 50612,
73
+ "<extra_id_15>": 50756,
74
+ "<extra_id_160>": 50611,
75
+ "<extra_id_161>": 50610,
76
+ "<extra_id_162>": 50609,
77
+ "<extra_id_163>": 50608,
78
+ "<extra_id_164>": 50607,
79
+ "<extra_id_165>": 50606,
80
+ "<extra_id_166>": 50605,
81
+ "<extra_id_167>": 50604,
82
+ "<extra_id_168>": 50603,
83
+ "<extra_id_169>": 50602,
84
+ "<extra_id_16>": 50755,
85
+ "<extra_id_170>": 50601,
86
+ "<extra_id_171>": 50600,
87
+ "<extra_id_172>": 50599,
88
+ "<extra_id_173>": 50598,
89
+ "<extra_id_174>": 50597,
90
+ "<extra_id_175>": 50596,
91
+ "<extra_id_176>": 50595,
92
+ "<extra_id_177>": 50594,
93
+ "<extra_id_178>": 50593,
94
+ "<extra_id_179>": 50592,
95
+ "<extra_id_17>": 50754,
96
+ "<extra_id_180>": 50591,
97
+ "<extra_id_181>": 50590,
98
+ "<extra_id_182>": 50589,
99
+ "<extra_id_183>": 50588,
100
+ "<extra_id_184>": 50587,
101
+ "<extra_id_185>": 50586,
102
+ "<extra_id_186>": 50585,
103
+ "<extra_id_187>": 50584,
104
+ "<extra_id_188>": 50583,
105
+ "<extra_id_189>": 50582,
106
+ "<extra_id_18>": 50753,
107
+ "<extra_id_190>": 50581,
108
+ "<extra_id_191>": 50580,
109
+ "<extra_id_192>": 50579,
110
+ "<extra_id_193>": 50578,
111
+ "<extra_id_194>": 50577,
112
+ "<extra_id_195>": 50576,
113
+ "<extra_id_196>": 50575,
114
+ "<extra_id_197>": 50574,
115
+ "<extra_id_198>": 50573,
116
+ "<extra_id_199>": 50572,
117
+ "<extra_id_19>": 50752,
118
+ "<extra_id_1>": 50770,
119
+ "<extra_id_200>": 50571,
120
+ "<extra_id_201>": 50570,
121
+ "<extra_id_202>": 50569,
122
+ "<extra_id_203>": 50568,
123
+ "<extra_id_204>": 50567,
124
+ "<extra_id_205>": 50566,
125
+ "<extra_id_206>": 50565,
126
+ "<extra_id_207>": 50564,
127
+ "<extra_id_208>": 50563,
128
+ "<extra_id_209>": 50562,
129
+ "<extra_id_20>": 50751,
130
+ "<extra_id_210>": 50561,
131
+ "<extra_id_211>": 50560,
132
+ "<extra_id_212>": 50559,
133
+ "<extra_id_213>": 50558,
134
+ "<extra_id_214>": 50557,
135
+ "<extra_id_215>": 50556,
136
+ "<extra_id_216>": 50555,
137
+ "<extra_id_217>": 50554,
138
+ "<extra_id_218>": 50553,
139
+ "<extra_id_219>": 50552,
140
+ "<extra_id_21>": 50750,
141
+ "<extra_id_220>": 50551,
142
+ "<extra_id_221>": 50550,
143
+ "<extra_id_222>": 50549,
144
+ "<extra_id_223>": 50548,
145
+ "<extra_id_224>": 50547,
146
+ "<extra_id_225>": 50546,
147
+ "<extra_id_226>": 50545,
148
+ "<extra_id_227>": 50544,
149
+ "<extra_id_228>": 50543,
150
+ "<extra_id_229>": 50542,
151
+ "<extra_id_22>": 50749,
152
+ "<extra_id_230>": 50541,
153
+ "<extra_id_231>": 50540,
154
+ "<extra_id_232>": 50539,
155
+ "<extra_id_233>": 50538,
156
+ "<extra_id_234>": 50537,
157
+ "<extra_id_235>": 50536,
158
+ "<extra_id_236>": 50535,
159
+ "<extra_id_237>": 50534,
160
+ "<extra_id_238>": 50533,
161
+ "<extra_id_239>": 50532,
162
+ "<extra_id_23>": 50748,
163
+ "<extra_id_240>": 50531,
164
+ "<extra_id_241>": 50530,
165
+ "<extra_id_242>": 50529,
166
+ "<extra_id_243>": 50528,
167
+ "<extra_id_244>": 50527,
168
+ "<extra_id_245>": 50526,
169
+ "<extra_id_246>": 50525,
170
+ "<extra_id_247>": 50524,
171
+ "<extra_id_248>": 50523,
172
+ "<extra_id_249>": 50522,
173
+ "<extra_id_24>": 50747,
174
+ "<extra_id_250>": 50521,
175
+ "<extra_id_251>": 50520,
176
+ "<extra_id_252>": 50519,
177
+ "<extra_id_253>": 50518,
178
+ "<extra_id_254>": 50517,
179
+ "<extra_id_255>": 50516,
180
+ "<extra_id_256>": 50515,
181
+ "<extra_id_257>": 50514,
182
+ "<extra_id_258>": 50513,
183
+ "<extra_id_259>": 50512,
184
+ "<extra_id_25>": 50746,
185
+ "<extra_id_260>": 50511,
186
+ "<extra_id_261>": 50510,
187
+ "<extra_id_262>": 50509,
188
+ "<extra_id_263>": 50508,
189
+ "<extra_id_264>": 50507,
190
+ "<extra_id_265>": 50506,
191
+ "<extra_id_266>": 50505,
192
+ "<extra_id_267>": 50504,
193
+ "<extra_id_268>": 50503,
194
+ "<extra_id_269>": 50502,
195
+ "<extra_id_26>": 50745,
196
+ "<extra_id_270>": 50501,
197
+ "<extra_id_271>": 50500,
198
+ "<extra_id_272>": 50499,
199
+ "<extra_id_273>": 50498,
200
+ "<extra_id_274>": 50497,
201
+ "<extra_id_275>": 50496,
202
+ "<extra_id_276>": 50495,
203
+ "<extra_id_277>": 50494,
204
+ "<extra_id_278>": 50493,
205
+ "<extra_id_279>": 50492,
206
+ "<extra_id_27>": 50744,
207
+ "<extra_id_280>": 50491,
208
+ "<extra_id_281>": 50490,
209
+ "<extra_id_282>": 50489,
210
+ "<extra_id_283>": 50488,
211
+ "<extra_id_284>": 50487,
212
+ "<extra_id_285>": 50486,
213
+ "<extra_id_286>": 50485,
214
+ "<extra_id_287>": 50484,
215
+ "<extra_id_288>": 50483,
216
+ "<extra_id_289>": 50482,
217
+ "<extra_id_28>": 50743,
218
+ "<extra_id_290>": 50481,
219
+ "<extra_id_291>": 50480,
220
+ "<extra_id_292>": 50479,
221
+ "<extra_id_293>": 50478,
222
+ "<extra_id_294>": 50477,
223
+ "<extra_id_295>": 50476,
224
+ "<extra_id_296>": 50475,
225
+ "<extra_id_297>": 50474,
226
+ "<extra_id_298>": 50473,
227
+ "<extra_id_299>": 50472,
228
+ "<extra_id_29>": 50742,
229
+ "<extra_id_2>": 50769,
230
+ "<extra_id_300>": 50471,
231
+ "<extra_id_301>": 50470,
232
+ "<extra_id_302>": 50469,
233
+ "<extra_id_303>": 50468,
234
+ "<extra_id_304>": 50467,
235
+ "<extra_id_305>": 50466,
236
+ "<extra_id_306>": 50465,
237
+ "<extra_id_307>": 50464,
238
+ "<extra_id_308>": 50463,
239
+ "<extra_id_309>": 50462,
240
+ "<extra_id_30>": 50741,
241
+ "<extra_id_310>": 50461,
242
+ "<extra_id_311>": 50460,
243
+ "<extra_id_312>": 50459,
244
+ "<extra_id_313>": 50458,
245
+ "<extra_id_314>": 50457,
246
+ "<extra_id_315>": 50456,
247
+ "<extra_id_316>": 50455,
248
+ "<extra_id_317>": 50454,
249
+ "<extra_id_318>": 50453,
250
+ "<extra_id_319>": 50452,
251
+ "<extra_id_31>": 50740,
252
+ "<extra_id_320>": 50451,
253
+ "<extra_id_321>": 50450,
254
+ "<extra_id_322>": 50449,
255
+ "<extra_id_323>": 50448,
256
+ "<extra_id_324>": 50447,
257
+ "<extra_id_325>": 50446,
258
+ "<extra_id_326>": 50445,
259
+ "<extra_id_327>": 50444,
260
+ "<extra_id_328>": 50443,
261
+ "<extra_id_329>": 50442,
262
+ "<extra_id_32>": 50739,
263
+ "<extra_id_330>": 50441,
264
+ "<extra_id_331>": 50440,
265
+ "<extra_id_332>": 50439,
266
+ "<extra_id_333>": 50438,
267
+ "<extra_id_334>": 50437,
268
+ "<extra_id_335>": 50436,
269
+ "<extra_id_336>": 50435,
270
+ "<extra_id_337>": 50434,
271
+ "<extra_id_338>": 50433,
272
+ "<extra_id_339>": 50432,
273
+ "<extra_id_33>": 50738,
274
+ "<extra_id_340>": 50431,
275
+ "<extra_id_341>": 50430,
276
+ "<extra_id_342>": 50429,
277
+ "<extra_id_343>": 50428,
278
+ "<extra_id_344>": 50427,
279
+ "<extra_id_345>": 50426,
280
+ "<extra_id_346>": 50425,
281
+ "<extra_id_347>": 50424,
282
+ "<extra_id_348>": 50423,
283
+ "<extra_id_349>": 50422,
284
+ "<extra_id_34>": 50737,
285
+ "<extra_id_350>": 50421,
286
+ "<extra_id_351>": 50420,
287
+ "<extra_id_352>": 50419,
288
+ "<extra_id_353>": 50418,
289
+ "<extra_id_354>": 50417,
290
+ "<extra_id_355>": 50416,
291
+ "<extra_id_356>": 50415,
292
+ "<extra_id_357>": 50414,
293
+ "<extra_id_358>": 50413,
294
+ "<extra_id_359>": 50412,
295
+ "<extra_id_35>": 50736,
296
+ "<extra_id_360>": 50411,
297
+ "<extra_id_361>": 50410,
298
+ "<extra_id_362>": 50409,
299
+ "<extra_id_363>": 50408,
300
+ "<extra_id_364>": 50407,
301
+ "<extra_id_365>": 50406,
302
+ "<extra_id_366>": 50405,
303
+ "<extra_id_367>": 50404,
304
+ "<extra_id_368>": 50403,
305
+ "<extra_id_369>": 50402,
306
+ "<extra_id_36>": 50735,
307
+ "<extra_id_370>": 50401,
308
+ "<extra_id_371>": 50400,
309
+ "<extra_id_372>": 50399,
310
+ "<extra_id_373>": 50398,
311
+ "<extra_id_374>": 50397,
312
+ "<extra_id_375>": 50396,
313
+ "<extra_id_376>": 50395,
314
+ "<extra_id_377>": 50394,
315
+ "<extra_id_378>": 50393,
316
+ "<extra_id_379>": 50392,
317
+ "<extra_id_37>": 50734,
318
+ "<extra_id_380>": 50391,
319
+ "<extra_id_381>": 50390,
320
+ "<extra_id_382>": 50389,
321
+ "<extra_id_383>": 50388,
322
+ "<extra_id_384>": 50387,
323
+ "<extra_id_385>": 50386,
324
+ "<extra_id_386>": 50385,
325
+ "<extra_id_387>": 50384,
326
+ "<extra_id_388>": 50383,
327
+ "<extra_id_389>": 50382,
328
+ "<extra_id_38>": 50733,
329
+ "<extra_id_390>": 50381,
330
+ "<extra_id_391>": 50380,
331
+ "<extra_id_392>": 50379,
332
+ "<extra_id_393>": 50378,
333
+ "<extra_id_394>": 50377,
334
+ "<extra_id_395>": 50376,
335
+ "<extra_id_396>": 50375,
336
+ "<extra_id_397>": 50374,
337
+ "<extra_id_398>": 50373,
338
+ "<extra_id_399>": 50372,
339
+ "<extra_id_39>": 50732,
340
+ "<extra_id_3>": 50768,
341
+ "<extra_id_400>": 50371,
342
+ "<extra_id_401>": 50370,
343
+ "<extra_id_402>": 50369,
344
+ "<extra_id_403>": 50368,
345
+ "<extra_id_404>": 50367,
346
+ "<extra_id_405>": 50366,
347
+ "<extra_id_406>": 50365,
348
+ "<extra_id_407>": 50364,
349
+ "<extra_id_408>": 50363,
350
+ "<extra_id_409>": 50362,
351
+ "<extra_id_40>": 50731,
352
+ "<extra_id_410>": 50361,
353
+ "<extra_id_411>": 50360,
354
+ "<extra_id_412>": 50359,
355
+ "<extra_id_413>": 50358,
356
+ "<extra_id_414>": 50357,
357
+ "<extra_id_415>": 50356,
358
+ "<extra_id_416>": 50355,
359
+ "<extra_id_417>": 50354,
360
+ "<extra_id_418>": 50353,
361
+ "<extra_id_419>": 50352,
362
+ "<extra_id_41>": 50730,
363
+ "<extra_id_420>": 50351,
364
+ "<extra_id_421>": 50350,
365
+ "<extra_id_422>": 50349,
366
+ "<extra_id_423>": 50348,
367
+ "<extra_id_424>": 50347,
368
+ "<extra_id_425>": 50346,
369
+ "<extra_id_426>": 50345,
370
+ "<extra_id_427>": 50344,
371
+ "<extra_id_428>": 50343,
372
+ "<extra_id_429>": 50342,
373
+ "<extra_id_42>": 50729,
374
+ "<extra_id_430>": 50341,
375
+ "<extra_id_431>": 50340,
376
+ "<extra_id_432>": 50339,
377
+ "<extra_id_433>": 50338,
378
+ "<extra_id_434>": 50337,
379
+ "<extra_id_435>": 50336,
380
+ "<extra_id_436>": 50335,
381
+ "<extra_id_437>": 50334,
382
+ "<extra_id_438>": 50333,
383
+ "<extra_id_439>": 50332,
384
+ "<extra_id_43>": 50728,
385
+ "<extra_id_440>": 50331,
386
+ "<extra_id_441>": 50330,
387
+ "<extra_id_442>": 50329,
388
+ "<extra_id_443>": 50328,
389
+ "<extra_id_444>": 50327,
390
+ "<extra_id_445>": 50326,
391
+ "<extra_id_446>": 50325,
392
+ "<extra_id_447>": 50324,
393
+ "<extra_id_448>": 50323,
394
+ "<extra_id_449>": 50322,
395
+ "<extra_id_44>": 50727,
396
+ "<extra_id_450>": 50321,
397
+ "<extra_id_451>": 50320,
398
+ "<extra_id_452>": 50319,
399
+ "<extra_id_453>": 50318,
400
+ "<extra_id_454>": 50317,
401
+ "<extra_id_455>": 50316,
402
+ "<extra_id_456>": 50315,
403
+ "<extra_id_457>": 50314,
404
+ "<extra_id_458>": 50313,
405
+ "<extra_id_459>": 50312,
406
+ "<extra_id_45>": 50726,
407
+ "<extra_id_460>": 50311,
408
+ "<extra_id_461>": 50310,
409
+ "<extra_id_462>": 50309,
410
+ "<extra_id_463>": 50308,
411
+ "<extra_id_464>": 50307,
412
+ "<extra_id_465>": 50306,
413
+ "<extra_id_466>": 50305,
414
+ "<extra_id_467>": 50304,
415
+ "<extra_id_468>": 50303,
416
+ "<extra_id_469>": 50302,
417
+ "<extra_id_46>": 50725,
418
+ "<extra_id_470>": 50301,
419
+ "<extra_id_471>": 50300,
420
+ "<extra_id_472>": 50299,
421
+ "<extra_id_473>": 50298,
422
+ "<extra_id_474>": 50297,
423
+ "<extra_id_475>": 50296,
424
+ "<extra_id_476>": 50295,
425
+ "<extra_id_477>": 50294,
426
+ "<extra_id_478>": 50293,
427
+ "<extra_id_479>": 50292,
428
+ "<extra_id_47>": 50724,
429
+ "<extra_id_480>": 50291,
430
+ "<extra_id_481>": 50290,
431
+ "<extra_id_482>": 50289,
432
+ "<extra_id_483>": 50288,
433
+ "<extra_id_484>": 50287,
434
+ "<extra_id_485>": 50286,
435
+ "<extra_id_486>": 50285,
436
+ "<extra_id_487>": 50284,
437
+ "<extra_id_488>": 50283,
438
+ "<extra_id_489>": 50282,
439
+ "<extra_id_48>": 50723,
440
+ "<extra_id_490>": 50281,
441
+ "<extra_id_491>": 50280,
442
+ "<extra_id_492>": 50279,
443
+ "<extra_id_493>": 50278,
444
+ "<extra_id_494>": 50277,
445
+ "<extra_id_495>": 50276,
446
+ "<extra_id_496>": 50275,
447
+ "<extra_id_497>": 50274,
448
+ "<extra_id_498>": 50273,
449
+ "<extra_id_499>": 50272,
450
+ "<extra_id_49>": 50722,
451
+ "<extra_id_4>": 50767,
452
+ "<extra_id_500>": 50271,
453
+ "<extra_id_50>": 50721,
454
+ "<extra_id_51>": 50720,
455
+ "<extra_id_52>": 50719,
456
+ "<extra_id_53>": 50718,
457
+ "<extra_id_54>": 50717,
458
+ "<extra_id_55>": 50716,
459
+ "<extra_id_56>": 50715,
460
+ "<extra_id_57>": 50714,
461
+ "<extra_id_58>": 50713,
462
+ "<extra_id_59>": 50712,
463
+ "<extra_id_5>": 50766,
464
+ "<extra_id_60>": 50711,
465
+ "<extra_id_61>": 50710,
466
+ "<extra_id_62>": 50709,
467
+ "<extra_id_63>": 50708,
468
+ "<extra_id_64>": 50707,
469
+ "<extra_id_65>": 50706,
470
+ "<extra_id_66>": 50705,
471
+ "<extra_id_67>": 50704,
472
+ "<extra_id_68>": 50703,
473
+ "<extra_id_69>": 50702,
474
+ "<extra_id_6>": 50765,
475
+ "<extra_id_70>": 50701,
476
+ "<extra_id_71>": 50700,
477
+ "<extra_id_72>": 50699,
478
+ "<extra_id_73>": 50698,
479
+ "<extra_id_74>": 50697,
480
+ "<extra_id_75>": 50696,
481
+ "<extra_id_76>": 50695,
482
+ "<extra_id_77>": 50694,
483
+ "<extra_id_78>": 50693,
484
+ "<extra_id_79>": 50692,
485
+ "<extra_id_7>": 50764,
486
+ "<extra_id_80>": 50691,
487
+ "<extra_id_81>": 50690,
488
+ "<extra_id_82>": 50689,
489
+ "<extra_id_83>": 50688,
490
+ "<extra_id_84>": 50687,
491
+ "<extra_id_85>": 50686,
492
+ "<extra_id_86>": 50685,
493
+ "<extra_id_87>": 50684,
494
+ "<extra_id_88>": 50683,
495
+ "<extra_id_89>": 50682,
496
+ "<extra_id_8>": 50763,
497
+ "<extra_id_90>": 50681,
498
+ "<extra_id_91>": 50680,
499
+ "<extra_id_92>": 50679,
500
+ "<extra_id_93>": 50678,
501
+ "<extra_id_94>": 50677,
502
+ "<extra_id_95>": 50676,
503
+ "<extra_id_96>": 50675,
504
+ "<extra_id_97>": 50674,
505
+ "<extra_id_98>": 50673,
506
+ "<extra_id_99>": 50672,
507
+ "<extra_id_9>": 50762,
508
+ "<sec>": 50267
509
+ }
config.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "HEDForConditionalGeneration"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "bos_token_id": 0,
7
+ "classifier_dropout": 0.1,
8
+ "d_ff": 3072,
9
+ "d_kv": 64,
10
+ "d_model": 768,
11
+ "decode_anchor_tokens": false,
12
+ "decoder_start_token_id": 0,
13
+ "dense_act_fn": "relu",
14
+ "dropout_rate": 0.1,
15
+ "eos_token_id": 2,
16
+ "eval_splits": null,
17
+ "feed_forward_proj": "relu",
18
+ "hidden_dropout_prob": 0.1,
19
+ "initializer_factor": 1.0,
20
+ "is_encoder_decoder": true,
21
+ "is_gated_act": false,
22
+ "layer_norm_epsilon": 1e-06,
23
+ "max_decoder_position_embeddings": 512,
24
+ "max_encoder_position_embeddings": 8192,
25
+ "model_type": "hed",
26
+ "num_decoder_layers": 6,
27
+ "num_heads": 12,
28
+ "num_layers": 6,
29
+ "pad_token_id": 1,
30
+ "pool_scheme": "first-token",
31
+ "pos_emb": "scaled-sinusoidal",
32
+ "position_embedding_type": "quaternion",
33
+ "prediction_head": false,
34
+ "relative_attention_max_distance": 128,
35
+ "relative_attention_num_buckets": 32,
36
+ "sep_token_id": 2,
37
+ "torch_dtype": "float32",
38
+ "transformers_version": "4.29.0.dev0",
39
+ "use_bias": false,
40
+ "use_cache": true,
41
+ "vocab_size": 50772
42
+ }
generation_config.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 0,
4
+ "decoder_start_token_id": 0,
5
+ "eos_token_id": 2,
6
+ "pad_token_id": 1,
7
+ "transformers_version": "4.29.0.dev0"
8
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00e25534b3cb06beac407a374011b110557849e36f6da7f20ef4590eb5868d2b
3
+ size 552487070
special_tokens_map.json ADDED
@@ -0,0 +1,553 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<doc>",
4
+ "<sec>",
5
+ "<NLU>",
6
+ "<NLG>",
7
+ "<S2S>",
8
+ "<extra_id_500>",
9
+ "<extra_id_499>",
10
+ "<extra_id_498>",
11
+ "<extra_id_497>",
12
+ "<extra_id_496>",
13
+ "<extra_id_495>",
14
+ "<extra_id_494>",
15
+ "<extra_id_493>",
16
+ "<extra_id_492>",
17
+ "<extra_id_491>",
18
+ "<extra_id_490>",
19
+ "<extra_id_489>",
20
+ "<extra_id_488>",
21
+ "<extra_id_487>",
22
+ "<extra_id_486>",
23
+ "<extra_id_485>",
24
+ "<extra_id_484>",
25
+ "<extra_id_483>",
26
+ "<extra_id_482>",
27
+ "<extra_id_481>",
28
+ "<extra_id_480>",
29
+ "<extra_id_479>",
30
+ "<extra_id_478>",
31
+ "<extra_id_477>",
32
+ "<extra_id_476>",
33
+ "<extra_id_475>",
34
+ "<extra_id_474>",
35
+ "<extra_id_473>",
36
+ "<extra_id_472>",
37
+ "<extra_id_471>",
38
+ "<extra_id_470>",
39
+ "<extra_id_469>",
40
+ "<extra_id_468>",
41
+ "<extra_id_467>",
42
+ "<extra_id_466>",
43
+ "<extra_id_465>",
44
+ "<extra_id_464>",
45
+ "<extra_id_463>",
46
+ "<extra_id_462>",
47
+ "<extra_id_461>",
48
+ "<extra_id_460>",
49
+ "<extra_id_459>",
50
+ "<extra_id_458>",
51
+ "<extra_id_457>",
52
+ "<extra_id_456>",
53
+ "<extra_id_455>",
54
+ "<extra_id_454>",
55
+ "<extra_id_453>",
56
+ "<extra_id_452>",
57
+ "<extra_id_451>",
58
+ "<extra_id_450>",
59
+ "<extra_id_449>",
60
+ "<extra_id_448>",
61
+ "<extra_id_447>",
62
+ "<extra_id_446>",
63
+ "<extra_id_445>",
64
+ "<extra_id_444>",
65
+ "<extra_id_443>",
66
+ "<extra_id_442>",
67
+ "<extra_id_441>",
68
+ "<extra_id_440>",
69
+ "<extra_id_439>",
70
+ "<extra_id_438>",
71
+ "<extra_id_437>",
72
+ "<extra_id_436>",
73
+ "<extra_id_435>",
74
+ "<extra_id_434>",
75
+ "<extra_id_433>",
76
+ "<extra_id_432>",
77
+ "<extra_id_431>",
78
+ "<extra_id_430>",
79
+ "<extra_id_429>",
80
+ "<extra_id_428>",
81
+ "<extra_id_427>",
82
+ "<extra_id_426>",
83
+ "<extra_id_425>",
84
+ "<extra_id_424>",
85
+ "<extra_id_423>",
86
+ "<extra_id_422>",
87
+ "<extra_id_421>",
88
+ "<extra_id_420>",
89
+ "<extra_id_419>",
90
+ "<extra_id_418>",
91
+ "<extra_id_417>",
92
+ "<extra_id_416>",
93
+ "<extra_id_415>",
94
+ "<extra_id_414>",
95
+ "<extra_id_413>",
96
+ "<extra_id_412>",
97
+ "<extra_id_411>",
98
+ "<extra_id_410>",
99
+ "<extra_id_409>",
100
+ "<extra_id_408>",
101
+ "<extra_id_407>",
102
+ "<extra_id_406>",
103
+ "<extra_id_405>",
104
+ "<extra_id_404>",
105
+ "<extra_id_403>",
106
+ "<extra_id_402>",
107
+ "<extra_id_401>",
108
+ "<extra_id_400>",
109
+ "<extra_id_399>",
110
+ "<extra_id_398>",
111
+ "<extra_id_397>",
112
+ "<extra_id_396>",
113
+ "<extra_id_395>",
114
+ "<extra_id_394>",
115
+ "<extra_id_393>",
116
+ "<extra_id_392>",
117
+ "<extra_id_391>",
118
+ "<extra_id_390>",
119
+ "<extra_id_389>",
120
+ "<extra_id_388>",
121
+ "<extra_id_387>",
122
+ "<extra_id_386>",
123
+ "<extra_id_385>",
124
+ "<extra_id_384>",
125
+ "<extra_id_383>",
126
+ "<extra_id_382>",
127
+ "<extra_id_381>",
128
+ "<extra_id_380>",
129
+ "<extra_id_379>",
130
+ "<extra_id_378>",
131
+ "<extra_id_377>",
132
+ "<extra_id_376>",
133
+ "<extra_id_375>",
134
+ "<extra_id_374>",
135
+ "<extra_id_373>",
136
+ "<extra_id_372>",
137
+ "<extra_id_371>",
138
+ "<extra_id_370>",
139
+ "<extra_id_369>",
140
+ "<extra_id_368>",
141
+ "<extra_id_367>",
142
+ "<extra_id_366>",
143
+ "<extra_id_365>",
144
+ "<extra_id_364>",
145
+ "<extra_id_363>",
146
+ "<extra_id_362>",
147
+ "<extra_id_361>",
148
+ "<extra_id_360>",
149
+ "<extra_id_359>",
150
+ "<extra_id_358>",
151
+ "<extra_id_357>",
152
+ "<extra_id_356>",
153
+ "<extra_id_355>",
154
+ "<extra_id_354>",
155
+ "<extra_id_353>",
156
+ "<extra_id_352>",
157
+ "<extra_id_351>",
158
+ "<extra_id_350>",
159
+ "<extra_id_349>",
160
+ "<extra_id_348>",
161
+ "<extra_id_347>",
162
+ "<extra_id_346>",
163
+ "<extra_id_345>",
164
+ "<extra_id_344>",
165
+ "<extra_id_343>",
166
+ "<extra_id_342>",
167
+ "<extra_id_341>",
168
+ "<extra_id_340>",
169
+ "<extra_id_339>",
170
+ "<extra_id_338>",
171
+ "<extra_id_337>",
172
+ "<extra_id_336>",
173
+ "<extra_id_335>",
174
+ "<extra_id_334>",
175
+ "<extra_id_333>",
176
+ "<extra_id_332>",
177
+ "<extra_id_331>",
178
+ "<extra_id_330>",
179
+ "<extra_id_329>",
180
+ "<extra_id_328>",
181
+ "<extra_id_327>",
182
+ "<extra_id_326>",
183
+ "<extra_id_325>",
184
+ "<extra_id_324>",
185
+ "<extra_id_323>",
186
+ "<extra_id_322>",
187
+ "<extra_id_321>",
188
+ "<extra_id_320>",
189
+ "<extra_id_319>",
190
+ "<extra_id_318>",
191
+ "<extra_id_317>",
192
+ "<extra_id_316>",
193
+ "<extra_id_315>",
194
+ "<extra_id_314>",
195
+ "<extra_id_313>",
196
+ "<extra_id_312>",
197
+ "<extra_id_311>",
198
+ "<extra_id_310>",
199
+ "<extra_id_309>",
200
+ "<extra_id_308>",
201
+ "<extra_id_307>",
202
+ "<extra_id_306>",
203
+ "<extra_id_305>",
204
+ "<extra_id_304>",
205
+ "<extra_id_303>",
206
+ "<extra_id_302>",
207
+ "<extra_id_301>",
208
+ "<extra_id_300>",
209
+ "<extra_id_299>",
210
+ "<extra_id_298>",
211
+ "<extra_id_297>",
212
+ "<extra_id_296>",
213
+ "<extra_id_295>",
214
+ "<extra_id_294>",
215
+ "<extra_id_293>",
216
+ "<extra_id_292>",
217
+ "<extra_id_291>",
218
+ "<extra_id_290>",
219
+ "<extra_id_289>",
220
+ "<extra_id_288>",
221
+ "<extra_id_287>",
222
+ "<extra_id_286>",
223
+ "<extra_id_285>",
224
+ "<extra_id_284>",
225
+ "<extra_id_283>",
226
+ "<extra_id_282>",
227
+ "<extra_id_281>",
228
+ "<extra_id_280>",
229
+ "<extra_id_279>",
230
+ "<extra_id_278>",
231
+ "<extra_id_277>",
232
+ "<extra_id_276>",
233
+ "<extra_id_275>",
234
+ "<extra_id_274>",
235
+ "<extra_id_273>",
236
+ "<extra_id_272>",
237
+ "<extra_id_271>",
238
+ "<extra_id_270>",
239
+ "<extra_id_269>",
240
+ "<extra_id_268>",
241
+ "<extra_id_267>",
242
+ "<extra_id_266>",
243
+ "<extra_id_265>",
244
+ "<extra_id_264>",
245
+ "<extra_id_263>",
246
+ "<extra_id_262>",
247
+ "<extra_id_261>",
248
+ "<extra_id_260>",
249
+ "<extra_id_259>",
250
+ "<extra_id_258>",
251
+ "<extra_id_257>",
252
+ "<extra_id_256>",
253
+ "<extra_id_255>",
254
+ "<extra_id_254>",
255
+ "<extra_id_253>",
256
+ "<extra_id_252>",
257
+ "<extra_id_251>",
258
+ "<extra_id_250>",
259
+ "<extra_id_249>",
260
+ "<extra_id_248>",
261
+ "<extra_id_247>",
262
+ "<extra_id_246>",
263
+ "<extra_id_245>",
264
+ "<extra_id_244>",
265
+ "<extra_id_243>",
266
+ "<extra_id_242>",
267
+ "<extra_id_241>",
268
+ "<extra_id_240>",
269
+ "<extra_id_239>",
270
+ "<extra_id_238>",
271
+ "<extra_id_237>",
272
+ "<extra_id_236>",
273
+ "<extra_id_235>",
274
+ "<extra_id_234>",
275
+ "<extra_id_233>",
276
+ "<extra_id_232>",
277
+ "<extra_id_231>",
278
+ "<extra_id_230>",
279
+ "<extra_id_229>",
280
+ "<extra_id_228>",
281
+ "<extra_id_227>",
282
+ "<extra_id_226>",
283
+ "<extra_id_225>",
284
+ "<extra_id_224>",
285
+ "<extra_id_223>",
286
+ "<extra_id_222>",
287
+ "<extra_id_221>",
288
+ "<extra_id_220>",
289
+ "<extra_id_219>",
290
+ "<extra_id_218>",
291
+ "<extra_id_217>",
292
+ "<extra_id_216>",
293
+ "<extra_id_215>",
294
+ "<extra_id_214>",
295
+ "<extra_id_213>",
296
+ "<extra_id_212>",
297
+ "<extra_id_211>",
298
+ "<extra_id_210>",
299
+ "<extra_id_209>",
300
+ "<extra_id_208>",
301
+ "<extra_id_207>",
302
+ "<extra_id_206>",
303
+ "<extra_id_205>",
304
+ "<extra_id_204>",
305
+ "<extra_id_203>",
306
+ "<extra_id_202>",
307
+ "<extra_id_201>",
308
+ "<extra_id_200>",
309
+ "<extra_id_199>",
310
+ "<extra_id_198>",
311
+ "<extra_id_197>",
312
+ "<extra_id_196>",
313
+ "<extra_id_195>",
314
+ "<extra_id_194>",
315
+ "<extra_id_193>",
316
+ "<extra_id_192>",
317
+ "<extra_id_191>",
318
+ "<extra_id_190>",
319
+ "<extra_id_189>",
320
+ "<extra_id_188>",
321
+ "<extra_id_187>",
322
+ "<extra_id_186>",
323
+ "<extra_id_185>",
324
+ "<extra_id_184>",
325
+ "<extra_id_183>",
326
+ "<extra_id_182>",
327
+ "<extra_id_181>",
328
+ "<extra_id_180>",
329
+ "<extra_id_179>",
330
+ "<extra_id_178>",
331
+ "<extra_id_177>",
332
+ "<extra_id_176>",
333
+ "<extra_id_175>",
334
+ "<extra_id_174>",
335
+ "<extra_id_173>",
336
+ "<extra_id_172>",
337
+ "<extra_id_171>",
338
+ "<extra_id_170>",
339
+ "<extra_id_169>",
340
+ "<extra_id_168>",
341
+ "<extra_id_167>",
342
+ "<extra_id_166>",
343
+ "<extra_id_165>",
344
+ "<extra_id_164>",
345
+ "<extra_id_163>",
346
+ "<extra_id_162>",
347
+ "<extra_id_161>",
348
+ "<extra_id_160>",
349
+ "<extra_id_159>",
350
+ "<extra_id_158>",
351
+ "<extra_id_157>",
352
+ "<extra_id_156>",
353
+ "<extra_id_155>",
354
+ "<extra_id_154>",
355
+ "<extra_id_153>",
356
+ "<extra_id_152>",
357
+ "<extra_id_151>",
358
+ "<extra_id_150>",
359
+ "<extra_id_149>",
360
+ "<extra_id_148>",
361
+ "<extra_id_147>",
362
+ "<extra_id_146>",
363
+ "<extra_id_145>",
364
+ "<extra_id_144>",
365
+ "<extra_id_143>",
366
+ "<extra_id_142>",
367
+ "<extra_id_141>",
368
+ "<extra_id_140>",
369
+ "<extra_id_139>",
370
+ "<extra_id_138>",
371
+ "<extra_id_137>",
372
+ "<extra_id_136>",
373
+ "<extra_id_135>",
374
+ "<extra_id_134>",
375
+ "<extra_id_133>",
376
+ "<extra_id_132>",
377
+ "<extra_id_131>",
378
+ "<extra_id_130>",
379
+ "<extra_id_129>",
380
+ "<extra_id_128>",
381
+ "<extra_id_127>",
382
+ "<extra_id_126>",
383
+ "<extra_id_125>",
384
+ "<extra_id_124>",
385
+ "<extra_id_123>",
386
+ "<extra_id_122>",
387
+ "<extra_id_121>",
388
+ "<extra_id_120>",
389
+ "<extra_id_119>",
390
+ "<extra_id_118>",
391
+ "<extra_id_117>",
392
+ "<extra_id_116>",
393
+ "<extra_id_115>",
394
+ "<extra_id_114>",
395
+ "<extra_id_113>",
396
+ "<extra_id_112>",
397
+ "<extra_id_111>",
398
+ "<extra_id_110>",
399
+ "<extra_id_109>",
400
+ "<extra_id_108>",
401
+ "<extra_id_107>",
402
+ "<extra_id_106>",
403
+ "<extra_id_105>",
404
+ "<extra_id_104>",
405
+ "<extra_id_103>",
406
+ "<extra_id_102>",
407
+ "<extra_id_101>",
408
+ "<extra_id_100>",
409
+ "<extra_id_99>",
410
+ "<extra_id_98>",
411
+ "<extra_id_97>",
412
+ "<extra_id_96>",
413
+ "<extra_id_95>",
414
+ "<extra_id_94>",
415
+ "<extra_id_93>",
416
+ "<extra_id_92>",
417
+ "<extra_id_91>",
418
+ "<extra_id_90>",
419
+ "<extra_id_89>",
420
+ "<extra_id_88>",
421
+ "<extra_id_87>",
422
+ "<extra_id_86>",
423
+ "<extra_id_85>",
424
+ "<extra_id_84>",
425
+ "<extra_id_83>",
426
+ "<extra_id_82>",
427
+ "<extra_id_81>",
428
+ "<extra_id_80>",
429
+ "<extra_id_79>",
430
+ "<extra_id_78>",
431
+ "<extra_id_77>",
432
+ "<extra_id_76>",
433
+ "<extra_id_75>",
434
+ "<extra_id_74>",
435
+ "<extra_id_73>",
436
+ "<extra_id_72>",
437
+ "<extra_id_71>",
438
+ "<extra_id_70>",
439
+ "<extra_id_69>",
440
+ "<extra_id_68>",
441
+ "<extra_id_67>",
442
+ "<extra_id_66>",
443
+ "<extra_id_65>",
444
+ "<extra_id_64>",
445
+ "<extra_id_63>",
446
+ "<extra_id_62>",
447
+ "<extra_id_61>",
448
+ "<extra_id_60>",
449
+ "<extra_id_59>",
450
+ "<extra_id_58>",
451
+ "<extra_id_57>",
452
+ "<extra_id_56>",
453
+ "<extra_id_55>",
454
+ "<extra_id_54>",
455
+ "<extra_id_53>",
456
+ "<extra_id_52>",
457
+ "<extra_id_51>",
458
+ "<extra_id_50>",
459
+ "<extra_id_49>",
460
+ "<extra_id_48>",
461
+ "<extra_id_47>",
462
+ "<extra_id_46>",
463
+ "<extra_id_45>",
464
+ "<extra_id_44>",
465
+ "<extra_id_43>",
466
+ "<extra_id_42>",
467
+ "<extra_id_41>",
468
+ "<extra_id_40>",
469
+ "<extra_id_39>",
470
+ "<extra_id_38>",
471
+ "<extra_id_37>",
472
+ "<extra_id_36>",
473
+ "<extra_id_35>",
474
+ "<extra_id_34>",
475
+ "<extra_id_33>",
476
+ "<extra_id_32>",
477
+ "<extra_id_31>",
478
+ "<extra_id_30>",
479
+ "<extra_id_29>",
480
+ "<extra_id_28>",
481
+ "<extra_id_27>",
482
+ "<extra_id_26>",
483
+ "<extra_id_25>",
484
+ "<extra_id_24>",
485
+ "<extra_id_23>",
486
+ "<extra_id_22>",
487
+ "<extra_id_21>",
488
+ "<extra_id_20>",
489
+ "<extra_id_19>",
490
+ "<extra_id_18>",
491
+ "<extra_id_17>",
492
+ "<extra_id_16>",
493
+ "<extra_id_15>",
494
+ "<extra_id_14>",
495
+ "<extra_id_13>",
496
+ "<extra_id_12>",
497
+ "<extra_id_11>",
498
+ "<extra_id_10>",
499
+ "<extra_id_9>",
500
+ "<extra_id_8>",
501
+ "<extra_id_7>",
502
+ "<extra_id_6>",
503
+ "<extra_id_5>",
504
+ "<extra_id_4>",
505
+ "<extra_id_3>",
506
+ "<extra_id_2>",
507
+ "<extra_id_1>",
508
+ "<extra_id_0>"
509
+ ],
510
+ "bos_token": {
511
+ "content": "<s>",
512
+ "lstrip": false,
513
+ "normalized": true,
514
+ "rstrip": false,
515
+ "single_word": false
516
+ },
517
+ "cls_token": "<cls>",
518
+ "eos_token": {
519
+ "content": "</s>",
520
+ "lstrip": false,
521
+ "normalized": true,
522
+ "rstrip": false,
523
+ "single_word": false
524
+ },
525
+ "mask_token": {
526
+ "content": "<mask>",
527
+ "lstrip": true,
528
+ "normalized": true,
529
+ "rstrip": false,
530
+ "single_word": false
531
+ },
532
+ "pad_token": {
533
+ "content": "<pad>",
534
+ "lstrip": false,
535
+ "normalized": true,
536
+ "rstrip": false,
537
+ "single_word": false
538
+ },
539
+ "sep_token": {
540
+ "content": "</s>",
541
+ "lstrip": false,
542
+ "normalized": true,
543
+ "rstrip": false,
544
+ "single_word": false
545
+ },
546
+ "unk_token": {
547
+ "content": "<unk>",
548
+ "lstrip": false,
549
+ "normalized": true,
550
+ "rstrip": false,
551
+ "single_word": false
552
+ }
553
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "bos_token": {
4
+ "__type": "AddedToken",
5
+ "content": "<s>",
6
+ "lstrip": false,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false
10
+ },
11
+ "clean_up_tokenization_spaces": true,
12
+ "cls_token": {
13
+ "__type": "AddedToken",
14
+ "content": "<s>",
15
+ "lstrip": false,
16
+ "normalized": true,
17
+ "rstrip": false,
18
+ "single_word": false
19
+ },
20
+ "eos_token": {
21
+ "__type": "AddedToken",
22
+ "content": "</s>",
23
+ "lstrip": false,
24
+ "normalized": true,
25
+ "rstrip": false,
26
+ "single_word": false
27
+ },
28
+ "errors": "replace",
29
+ "mask_token": {
30
+ "__type": "AddedToken",
31
+ "content": "<mask>",
32
+ "lstrip": true,
33
+ "normalized": true,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ },
37
+ "model_max_length": 16384,
38
+ "pad_token": {
39
+ "__type": "AddedToken",
40
+ "content": "<pad>",
41
+ "lstrip": false,
42
+ "normalized": true,
43
+ "rstrip": false,
44
+ "single_word": false
45
+ },
46
+ "sep_token": {
47
+ "__type": "AddedToken",
48
+ "content": "</s>",
49
+ "lstrip": false,
50
+ "normalized": true,
51
+ "rstrip": false,
52
+ "single_word": false
53
+ },
54
+ "tokenizer_class": "LEDTokenizer",
55
+ "trim_offsets": true,
56
+ "unk_token": {
57
+ "__type": "AddedToken",
58
+ "content": "<unk>",
59
+ "lstrip": false,
60
+ "normalized": true,
61
+ "rstrip": false,
62
+ "single_word": false
63
+ }
64
+ }
vocab.json ADDED
The diff for this file is too large to render. See raw diff