deskull committed on
Commit
23ff05c
·
verified ·
1 Parent(s): 98704b5

Upload MolCrawl compounds GPT-2 medium model

Browse files
config.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "GPT2LMHeadModel"
4
+ ],
5
+ "model_type": "gpt2",
6
+ "vocab_size": 612,
7
+ "n_positions": 1024,
8
+ "n_ctx": 1024,
9
+ "n_embd": 1024,
10
+ "n_layer": 24,
11
+ "n_head": 16,
12
+ "n_inner": 4096,
13
+ "activation_function": "gelu_new",
14
+ "resid_pdrop": 0.0,
15
+ "embd_pdrop": 0.0,
16
+ "attn_pdrop": 0.0,
17
+ "layer_norm_epsilon": 1e-05,
18
+ "initializer_range": 0.02,
19
+ "use_cache": true,
20
+ "bos_token_id": 0,
21
+ "eos_token_id": 0,
22
+ "transformers_version": "4.0.0",
23
+ "_name_or_path": "riken-gpt2",
24
+ "_riken_model_args": {
25
+ "n_layer": 24,
26
+ "n_head": 16,
27
+ "n_embd": 1024,
28
+ "block_size": 1024,
29
+ "bias": false,
30
+ "vocab_size": 612,
31
+ "dropout": 0.0
32
+ },
33
+ "_riken_bias": false
34
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa27704b376efe3207324b9c28b5bfa81fdee9740de4482514698b955ac9263f
3
+ size 1214910447
special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
tokenizer.json ADDED
@@ -0,0 +1,681 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
5
+ "added_tokens": [
6
+ {
7
+ "id": 0,
8
+ "content": "[PAD]",
9
+ "single_word": false,
10
+ "lstrip": false,
11
+ "rstrip": false,
12
+ "normalized": false,
13
+ "special": true
14
+ },
15
+ {
16
+ "id": 11,
17
+ "content": "[UNK]",
18
+ "single_word": false,
19
+ "lstrip": false,
20
+ "rstrip": false,
21
+ "normalized": false,
22
+ "special": true
23
+ },
24
+ {
25
+ "id": 12,
26
+ "content": "[CLS]",
27
+ "single_word": false,
28
+ "lstrip": false,
29
+ "rstrip": false,
30
+ "normalized": false,
31
+ "special": true
32
+ },
33
+ {
34
+ "id": 13,
35
+ "content": "[SEP]",
36
+ "single_word": false,
37
+ "lstrip": false,
38
+ "rstrip": false,
39
+ "normalized": false,
40
+ "special": true
41
+ },
42
+ {
43
+ "id": 14,
44
+ "content": "[MASK]",
45
+ "single_word": false,
46
+ "lstrip": false,
47
+ "rstrip": false,
48
+ "normalized": false,
49
+ "special": true
50
+ }
51
+ ],
52
+ "normalizer": null,
53
+ "pre_tokenizer": {
54
+ "type": "Split",
55
+ "pattern": {
56
+ "Regex": "(\\[[^\\]]+]|Br?|Cl?|N|O|S|P|F|I|b|c|n|o|s|p|\\(|\\)|\\.|=|#|-|\\+|\\\\|\\/|:|~|@|\\?|>>?|\\*|\\$|\\%[0-9]{2}|[0-9])"
57
+ },
58
+ "behavior": "Isolated",
59
+ "invert": false
60
+ },
61
+ "post_processor": null,
62
+ "decoder": null,
63
+ "model": {
64
+ "type": "WordLevel",
65
+ "vocab": {
66
+ "[PAD]": 0,
67
+ "[unused1]": 1,
68
+ "[unused2]": 2,
69
+ "[unused3]": 3,
70
+ "[unused4]": 4,
71
+ "[unused5]": 5,
72
+ "[unused6]": 6,
73
+ "[unused7]": 7,
74
+ "[unused8]": 8,
75
+ "[unused9]": 9,
76
+ "[unused10]": 10,
77
+ "[UNK]": 11,
78
+ "[CLS]": 12,
79
+ "[SEP]": 13,
80
+ "[MASK]": 14,
81
+ "c": 15,
82
+ "C": 16,
83
+ "(": 17,
84
+ ")": 18,
85
+ "O": 19,
86
+ "1": 20,
87
+ "2": 21,
88
+ "=": 22,
89
+ "N": 23,
90
+ ".": 24,
91
+ "n": 25,
92
+ "3": 26,
93
+ "F": 27,
94
+ "Cl": 28,
95
+ ">>": 29,
96
+ "~": 30,
97
+ "-": 31,
98
+ "4": 32,
99
+ "[C@H]": 33,
100
+ "S": 34,
101
+ "[C@@H]": 35,
102
+ "[O-]": 36,
103
+ "Br": 37,
104
+ "#": 38,
105
+ "/": 39,
106
+ "[nH]": 40,
107
+ "[N+]": 41,
108
+ "s": 42,
109
+ "5": 43,
110
+ "o": 44,
111
+ "P": 45,
112
+ "[Na+]": 46,
113
+ "[Si]": 47,
114
+ "I": 48,
115
+ "[Na]": 49,
116
+ "[Pd]": 50,
117
+ "[K+]": 51,
118
+ "[K]": 52,
119
+ "[P]": 53,
120
+ "B": 54,
121
+ "[C@]": 55,
122
+ "[C@@]": 56,
123
+ "[Cl-]": 57,
124
+ "6": 58,
125
+ "[OH-]": 59,
126
+ "\\": 60,
127
+ "[N-]": 61,
128
+ "[Li]": 62,
129
+ "[H]": 63,
130
+ "[2H]": 64,
131
+ "[NH4+]": 65,
132
+ "[c-]": 66,
133
+ "[P-]": 67,
134
+ "[Cs+]": 68,
135
+ "[Li+]": 69,
136
+ "[Cs]": 70,
137
+ "[NaH]": 71,
138
+ "[H-]": 72,
139
+ "[O+]": 73,
140
+ "[BH4-]": 74,
141
+ "[Cu]": 75,
142
+ "7": 76,
143
+ "[Mg]": 77,
144
+ "[Fe+2]": 78,
145
+ "[n+]": 79,
146
+ "[Sn]": 80,
147
+ "[BH-]": 81,
148
+ "[Pd+2]": 82,
149
+ "[CH]": 83,
150
+ "[I-]": 84,
151
+ "[Br-]": 85,
152
+ "[C-]": 86,
153
+ "[Zn]": 87,
154
+ "[B-]": 88,
155
+ "[F-]": 89,
156
+ "[Al]": 90,
157
+ "[P+]": 91,
158
+ "[BH3-]": 92,
159
+ "[Fe]": 93,
160
+ "[C]": 94,
161
+ "[AlH4]": 95,
162
+ "[Ni]": 96,
163
+ "[SiH]": 97,
164
+ "8": 98,
165
+ "[Cu+2]": 99,
166
+ "[Mn]": 100,
167
+ "[AlH]": 101,
168
+ "[nH+]": 102,
169
+ "[AlH4-]": 103,
170
+ "[O-2]": 104,
171
+ "[Cr]": 105,
172
+ "[Mg+2]": 106,
173
+ "[NH3+]": 107,
174
+ "[S@]": 108,
175
+ "[Pt]": 109,
176
+ "[Al+3]": 110,
177
+ "[S@@]": 111,
178
+ "[S-]": 112,
179
+ "[Ti]": 113,
180
+ "[Zn+2]": 114,
181
+ "[PH]": 115,
182
+ "[NH2+]": 116,
183
+ "[Ru]": 117,
184
+ "[Ag+]": 118,
185
+ "[S+]": 119,
186
+ "[I+3]": 120,
187
+ "[NH+]": 121,
188
+ "[Ca+2]": 122,
189
+ "[Ag]": 123,
190
+ "9": 124,
191
+ "[Os]": 125,
192
+ "[Se]": 126,
193
+ "[SiH2]": 127,
194
+ "[Ca]": 128,
195
+ "[Ti+4]": 129,
196
+ "[Ac]": 130,
197
+ "[Cu+]": 131,
198
+ "[S]": 132,
199
+ "[Rh]": 133,
200
+ "[Cl+3]": 134,
201
+ "[cH-]": 135,
202
+ "[Zn+]": 136,
203
+ "[O]": 137,
204
+ "[Cl+]": 138,
205
+ "[SH]": 139,
206
+ "[H+]": 140,
207
+ "[Pd+]": 141,
208
+ "[se]": 142,
209
+ "[PH+]": 143,
210
+ "[I]": 144,
211
+ "[Pt+2]": 145,
212
+ "[C+]": 146,
213
+ "[Mg+]": 147,
214
+ "[Hg]": 148,
215
+ "[W]": 149,
216
+ "[SnH]": 150,
217
+ "[SiH3]": 151,
218
+ "[Fe+3]": 152,
219
+ "[NH]": 153,
220
+ "[Mo]": 154,
221
+ "[CH2+]": 155,
222
+ "%10": 156,
223
+ "[CH2-]": 157,
224
+ "[CH2]": 158,
225
+ "[n-]": 159,
226
+ "[Ce+4]": 160,
227
+ "[NH-]": 161,
228
+ "[Co]": 162,
229
+ "[I+]": 163,
230
+ "[PH2]": 164,
231
+ "[Pt+4]": 165,
232
+ "[Ce]": 166,
233
+ "[B]": 167,
234
+ "[Sn+2]": 168,
235
+ "[Ba+2]": 169,
236
+ "%11": 170,
237
+ "[Fe-3]": 171,
238
+ "[18F]": 172,
239
+ "[SH-]": 173,
240
+ "[Pb+2]": 174,
241
+ "[Os-2]": 175,
242
+ "[Zr+4]": 176,
243
+ "[N]": 177,
244
+ "[Ir]": 178,
245
+ "[Bi]": 179,
246
+ "[Ni+2]": 180,
247
+ "[P@]": 181,
248
+ "[Co+2]": 182,
249
+ "[s+]": 183,
250
+ "[As]": 184,
251
+ "[P+3]": 185,
252
+ "[Hg+2]": 186,
253
+ "[Yb+3]": 187,
254
+ "[CH-]": 188,
255
+ "[Zr+2]": 189,
256
+ "[Mn+2]": 190,
257
+ "[CH+]": 191,
258
+ "[In]": 192,
259
+ "[KH]": 193,
260
+ "[Ce+3]": 194,
261
+ "[Zr]": 195,
262
+ "[AlH2-]": 196,
263
+ "[OH2+]": 197,
264
+ "[Ti+3]": 198,
265
+ "[Rh+2]": 199,
266
+ "[Sb]": 200,
267
+ "[S-2]": 201,
268
+ "%12": 202,
269
+ "[P@@]": 203,
270
+ "[Si@H]": 204,
271
+ "[Mn+4]": 205,
272
+ "p": 206,
273
+ "[Ba]": 207,
274
+ "[NH2-]": 208,
275
+ "[Ge]": 209,
276
+ "[Pb+4]": 210,
277
+ "[Cr+3]": 211,
278
+ "[Au]": 212,
279
+ "[LiH]": 213,
280
+ "[Sc+3]": 214,
281
+ "[o+]": 215,
282
+ "[Rh-3]": 216,
283
+ "%13": 217,
284
+ "[Br]": 218,
285
+ "[Sb-]": 219,
286
+ "[S@+]": 220,
287
+ "[I+2]": 221,
288
+ "[Ar]": 222,
289
+ "[V]": 223,
290
+ "[Cu-]": 224,
291
+ "[Al-]": 225,
292
+ "[Te]": 226,
293
+ "[13c]": 227,
294
+ "[13C]": 228,
295
+ "[Cl]": 229,
296
+ "[PH4+]": 230,
297
+ "[SiH4]": 231,
298
+ "[te]": 232,
299
+ "[CH3-]": 233,
300
+ "[S@@+]": 234,
301
+ "[Rh+3]": 235,
302
+ "[SH+]": 236,
303
+ "[Bi+3]": 237,
304
+ "[Br+2]": 238,
305
+ "[La]": 239,
306
+ "[La+3]": 240,
307
+ "[Pt-2]": 241,
308
+ "[N@@]": 242,
309
+ "[PH3+]": 243,
310
+ "[N@]": 244,
311
+ "[Si+4]": 245,
312
+ "[Sr+2]": 246,
313
+ "[Al+]": 247,
314
+ "[Pb]": 248,
315
+ "[SeH]": 249,
316
+ "[Si-]": 250,
317
+ "[V+5]": 251,
318
+ "[Y+3]": 252,
319
+ "[Re]": 253,
320
+ "[Ru+]": 254,
321
+ "[Sm]": 255,
322
+ "*": 256,
323
+ "[3H]": 257,
324
+ "[NH2]": 258,
325
+ "[Ag-]": 259,
326
+ "[13CH3]": 260,
327
+ "[OH+]": 261,
328
+ "[Ru+3]": 262,
329
+ "[OH]": 263,
330
+ "[Gd+3]": 264,
331
+ "[13CH2]": 265,
332
+ "[In+3]": 266,
333
+ "[Si@@]": 267,
334
+ "[Si@]": 268,
335
+ "[Ti+2]": 269,
336
+ "[Sn+]": 270,
337
+ "[Cl+2]": 271,
338
+ "[AlH-]": 272,
339
+ "[Pd-2]": 273,
340
+ "[SnH3]": 274,
341
+ "[B+3]": 275,
342
+ "[Cu-2]": 276,
343
+ "[Nd+3]": 277,
344
+ "[Pb+3]": 278,
345
+ "[13cH]": 279,
346
+ "[Fe-4]": 280,
347
+ "[Ga]": 281,
348
+ "[Sn+4]": 282,
349
+ "[Hg+]": 283,
350
+ "[11CH3]": 284,
351
+ "[Hf]": 285,
352
+ "[Pr]": 286,
353
+ "[Y]": 287,
354
+ "[S+2]": 288,
355
+ "[Cd]": 289,
356
+ "[Cr+6]": 290,
357
+ "[Zr+3]": 291,
358
+ "[Rh+]": 292,
359
+ "[CH3]": 293,
360
+ "[N-3]": 294,
361
+ "[Hf+2]": 295,
362
+ "[Th]": 296,
363
+ "[Sb+3]": 297,
364
+ "%14": 298,
365
+ "[Cr+2]": 299,
366
+ "[Ru+2]": 300,
367
+ "[Hf+4]": 301,
368
+ "[14C]": 302,
369
+ "[Ta]": 303,
370
+ "[Tl+]": 304,
371
+ "[B+]": 305,
372
+ "[Os+4]": 306,
373
+ "[PdH2]": 307,
374
+ "[Pd-]": 308,
375
+ "[Cd+2]": 309,
376
+ "[Co+3]": 310,
377
+ "[S+4]": 311,
378
+ "[Nb+5]": 312,
379
+ "[123I]": 313,
380
+ "[c+]": 314,
381
+ "[Rb+]": 315,
382
+ "[V+2]": 316,
383
+ "[CH3+]": 317,
384
+ "[Ag+2]": 318,
385
+ "[cH+]": 319,
386
+ "[Mn+3]": 320,
387
+ "[Se-]": 321,
388
+ "[As-]": 322,
389
+ "[Eu+3]": 323,
390
+ "[SH2]": 324,
391
+ "[Sm+3]": 325,
392
+ "[IH+]": 326,
393
+ "%15": 327,
394
+ "[OH3+]": 328,
395
+ "[PH3]": 329,
396
+ "[IH2+]": 330,
397
+ "[SH2+]": 331,
398
+ "[Ir+3]": 332,
399
+ "[AlH3]": 333,
400
+ "[Sc]": 334,
401
+ "[Yb]": 335,
402
+ "[15NH2]": 336,
403
+ "[Lu]": 337,
404
+ "[sH+]": 338,
405
+ "[Gd]": 339,
406
+ "[18F-]": 340,
407
+ "[SH3+]": 341,
408
+ "[SnH4]": 342,
409
+ "[TeH]": 343,
410
+ "[Si@@H]": 344,
411
+ "[Ga+3]": 345,
412
+ "[CaH2]": 346,
413
+ "[Tl]": 347,
414
+ "[Ta+5]": 348,
415
+ "[GeH]": 349,
416
+ "[Br+]": 350,
417
+ "[Sr]": 351,
418
+ "[Tl+3]": 352,
419
+ "[Sm+2]": 353,
420
+ "[PH5]": 354,
421
+ "%16": 355,
422
+ "[N@@+]": 356,
423
+ "[Au+3]": 357,
424
+ "[C-4]": 358,
425
+ "[Nd]": 359,
426
+ "[Ti+]": 360,
427
+ "[IH]": 361,
428
+ "[N@+]": 362,
429
+ "[125I]": 363,
430
+ "[Eu]": 364,
431
+ "[Sn+3]": 365,
432
+ "[Nb]": 366,
433
+ "[Er+3]": 367,
434
+ "[123I-]": 368,
435
+ "[14c]": 369,
436
+ "%17": 370,
437
+ "[SnH2]": 371,
438
+ "[YH]": 372,
439
+ "[Sb+5]": 373,
440
+ "[Pr+3]": 374,
441
+ "[Ir+]": 375,
442
+ "[N+3]": 376,
443
+ "[AlH2]": 377,
444
+ "[19F]": 378,
445
+ "%18": 379,
446
+ "[Tb]": 380,
447
+ "[14CH]": 381,
448
+ "[Mo+4]": 382,
449
+ "[Si+]": 383,
450
+ "[BH]": 384,
451
+ "[Be]": 385,
452
+ "[Rb]": 386,
453
+ "[pH]": 387,
454
+ "%19": 388,
455
+ "%20": 389,
456
+ "[Xe]": 390,
457
+ "[Ir-]": 391,
458
+ "[Be+2]": 392,
459
+ "[C+4]": 393,
460
+ "[RuH2]": 394,
461
+ "[15NH]": 395,
462
+ "[U+2]": 396,
463
+ "[Au-]": 397,
464
+ "%21": 398,
465
+ "%22": 399,
466
+ "[Au+]": 400,
467
+ "[15n]": 401,
468
+ "[Al+2]": 402,
469
+ "[Tb+3]": 403,
470
+ "[15N]": 404,
471
+ "[V+3]": 405,
472
+ "[W+6]": 406,
473
+ "[14CH3]": 407,
474
+ "[Cr+4]": 408,
475
+ "[ClH+]": 409,
476
+ "b": 410,
477
+ "[Ti+6]": 411,
478
+ "[Nd+]": 412,
479
+ "[Zr+]": 413,
480
+ "[PH2+]": 414,
481
+ "[Fm]": 415,
482
+ "[N@H+]": 416,
483
+ "[RuH]": 417,
484
+ "[Dy+3]": 418,
485
+ "%23": 419,
486
+ "[Hf+3]": 420,
487
+ "[W+4]": 421,
488
+ "[11C]": 422,
489
+ "[13CH]": 423,
490
+ "[Er]": 424,
491
+ "[124I]": 425,
492
+ "[LaH]": 426,
493
+ "[F]": 427,
494
+ "[siH]": 428,
495
+ "[Ga+]": 429,
496
+ "[Cm]": 430,
497
+ "[GeH3]": 431,
498
+ "[IH-]": 432,
499
+ "[U+6]": 433,
500
+ "[SeH+]": 434,
501
+ "[32P]": 435,
502
+ "[SeH-]": 436,
503
+ "[Pt-]": 437,
504
+ "[Ir+2]": 438,
505
+ "[se+]": 439,
506
+ "[U]": 440,
507
+ "[F+]": 441,
508
+ "[BH2]": 442,
509
+ "[As+]": 443,
510
+ "[Cf]": 444,
511
+ "[ClH2+]": 445,
512
+ "[Ni+]": 446,
513
+ "[TeH3]": 447,
514
+ "[SbH2]": 448,
515
+ "[Ag+3]": 449,
516
+ "%24": 450,
517
+ "[18O]": 451,
518
+ "[PH4]": 452,
519
+ "[Os+2]": 453,
520
+ "[Na-]": 454,
521
+ "[Sb+2]": 455,
522
+ "[V+4]": 456,
523
+ "[Ho+3]": 457,
524
+ "[68Ga]": 458,
525
+ "[PH-]": 459,
526
+ "[Bi+2]": 460,
527
+ "[Ce+2]": 461,
528
+ "[Pd+3]": 462,
529
+ "[99Tc]": 463,
530
+ "[13C@@H]": 464,
531
+ "[Fe+6]": 465,
532
+ "[c]": 466,
533
+ "[GeH2]": 467,
534
+ "[10B]": 468,
535
+ "[Cu+3]": 469,
536
+ "[Mo+2]": 470,
537
+ "[Cr+]": 471,
538
+ "[Pd+4]": 472,
539
+ "[Dy]": 473,
540
+ "[AsH]": 474,
541
+ "[Ba+]": 475,
542
+ "[SeH2]": 476,
543
+ "[In+]": 477,
544
+ "[TeH2]": 478,
545
+ "[BrH+]": 479,
546
+ "[14cH]": 480,
547
+ "[W+]": 481,
548
+ "[13C@H]": 482,
549
+ "[AsH2]": 483,
550
+ "[In+2]": 484,
551
+ "[N+2]": 485,
552
+ "[N@@H+]": 486,
553
+ "[SbH]": 487,
554
+ "[60Co]": 488,
555
+ "[AsH4+]": 489,
556
+ "[AsH3]": 490,
557
+ "[18OH]": 491,
558
+ "[Ru-2]": 492,
559
+ "[Na-2]": 493,
560
+ "[CuH2]": 494,
561
+ "[31P]": 495,
562
+ "[Ti+5]": 496,
563
+ "[35S]": 497,
564
+ "[P@@H]": 498,
565
+ "[ArH]": 499,
566
+ "[Co+]": 500,
567
+ "[Zr-2]": 501,
568
+ "[BH2-]": 502,
569
+ "[131I]": 503,
570
+ "[SH5]": 504,
571
+ "[VH]": 505,
572
+ "[B+2]": 506,
573
+ "[Yb+2]": 507,
574
+ "[14C@H]": 508,
575
+ "[211At]": 509,
576
+ "[NH3+2]": 510,
577
+ "[IrH]": 511,
578
+ "[IrH2]": 512,
579
+ "[Rh-]": 513,
580
+ "[Cr-]": 514,
581
+ "[Sb+]": 515,
582
+ "[Ni+3]": 516,
583
+ "[TaH3]": 517,
584
+ "[Tl+2]": 518,
585
+ "[64Cu]": 519,
586
+ "[Tc]": 520,
587
+ "[Cd+]": 521,
588
+ "[1H]": 522,
589
+ "[15nH]": 523,
590
+ "[AlH2+]": 524,
591
+ "[FH+2]": 525,
592
+ "[BiH3]": 526,
593
+ "[Ru-]": 527,
594
+ "[Mo+6]": 528,
595
+ "[AsH+]": 529,
596
+ "[BaH2]": 530,
597
+ "[BaH]": 531,
598
+ "[Fe+4]": 532,
599
+ "[229Th]": 533,
600
+ "[Th+4]": 534,
601
+ "[As+3]": 535,
602
+ "[NH+3]": 536,
603
+ "[P@H]": 537,
604
+ "[Li-]": 538,
605
+ "[7NaH]": 539,
606
+ "[Bi+]": 540,
607
+ "[PtH+2]": 541,
608
+ "[p-]": 542,
609
+ "[Re+5]": 543,
610
+ "[NiH]": 544,
611
+ "[Ni-]": 545,
612
+ "[Xe+]": 546,
613
+ "[Ca+]": 547,
614
+ "[11c]": 548,
615
+ "[Rh+4]": 549,
616
+ "[AcH]": 550,
617
+ "[HeH]": 551,
618
+ "[Sc+2]": 552,
619
+ "[Mn+]": 553,
620
+ "[UH]": 554,
621
+ "[14CH2]": 555,
622
+ "[SiH4+]": 556,
623
+ "[18OH2]": 557,
624
+ "[Ac-]": 558,
625
+ "[Re+4]": 559,
626
+ "[118Sn]": 560,
627
+ "[153Sm]": 561,
628
+ "[P+2]": 562,
629
+ "[9CH]": 563,
630
+ "[9CH3]": 564,
631
+ "[Y-]": 565,
632
+ "[NiH2]": 566,
633
+ "[Si+2]": 567,
634
+ "[Mn+6]": 568,
635
+ "[ZrH2]": 569,
636
+ "[C-2]": 570,
637
+ "[Bi+5]": 571,
638
+ "[24NaH]": 572,
639
+ "[Fr]": 573,
640
+ "[15CH]": 574,
641
+ "[Se+]": 575,
642
+ "[At]": 576,
643
+ "[P-3]": 577,
644
+ "[124I-]": 578,
645
+ "[CuH2-]": 579,
646
+ "[Nb+4]": 580,
647
+ "[Nb+3]": 581,
648
+ "[MgH]": 582,
649
+ "[Ir+4]": 583,
650
+ "[67Ga+3]": 584,
651
+ "[67Ga]": 585,
652
+ "[13N]": 586,
653
+ "[15OH2]": 587,
654
+ "[2NH]": 588,
655
+ "[Ho]": 589,
656
+ "[Cn]": 590,
657
+ "[0*]": 591,
658
+ "[1*]": 592,
659
+ "[2*]": 593,
660
+ "[3*]": 594,
661
+ "[4*]": 595,
662
+ "[5*]": 596,
663
+ "[6*]": 597,
664
+ "[7*]": 598,
665
+ "[8*]": 599,
666
+ "[9*]": 600,
667
+ "[10*]": 601,
668
+ "[11*]": 602,
669
+ "[12*]": 603,
670
+ "[13*]": 604,
671
+ "[14*]": 605,
672
+ "[15*]": 606,
673
+ "[16*]": 607,
674
+ "[17*]": 608,
675
+ "[18*]": 609,
676
+ "[19*]": 610,
677
+ "[20*]": 611
678
+ },
679
+ "unk_token": "[UNK]"
680
+ }
681
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "11": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "12": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "13": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "14": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": false,
45
+ "cls_token": "[CLS]",
46
+ "mask_token": "[MASK]",
47
+ "model_max_length": 1000000000000000019884624838656,
48
+ "pad_token": "[PAD]",
49
+ "sep_token": "[SEP]",
50
+ "tokenizer_class": "PreTrainedTokenizerFast",
51
+ "unk_token": "[UNK]"
52
+ }
training_args.json ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "iteration": 30000,
3
+ "best_val_loss": 0.03033723682165146,
4
+ "early_stopping_counter": 11,
5
+ "learning_rate": 6e-07,
6
+ "batch_size": 2,
7
+ "block_size": 1024,
8
+ "model_args": {
9
+ "n_layer": 24,
10
+ "n_head": 16,
11
+ "n_embd": 1024,
12
+ "block_size": 1024,
13
+ "bias": false,
14
+ "vocab_size": 612,
15
+ "dropout": 0.0
16
+ }
17
+ }