CocoRoF committed on
Commit
8e392ba
·
verified ·
1 Parent(s): d28b45f

Training in progress, step 7000, checkpoint

Browse files
last-checkpoint/config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "x2bee/KoModernBERT-base-mlm-v03-retry-ckp03",
3
  "architectures": [
4
  "ModernBERTSimCSE"
5
  ],
@@ -43,5 +43,5 @@
43
  "sparse_prediction": false,
44
  "torch_dtype": "float32",
45
  "transformers_version": "4.48.0.dev0",
46
- "vocab_size": 95663
47
  }
 
1
  {
2
+ "_name_or_path": "CocoRoF/KoModernBERT-chp-11",
3
  "architectures": [
4
  "ModernBERTSimCSE"
5
  ],
 
43
  "sparse_prediction": false,
44
  "torch_dtype": "float32",
45
  "transformers_version": "4.48.0.dev0",
46
+ "vocab_size": 55111
47
  }
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:703b75465ed45e4a47b755f4dbf7613f34e8cb9a9c6557491a46a67bc25a57ef
3
- size 737580392
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:039eb5c73d0c30d604c0b44c1ce93e67f4cad28867b354ed01f17480dad76a76
3
+ size 613004648
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:943fd807c0afa2eb74111f9b3a9e2bfca879f4ad22f91c7601145761a7d127c8
3
- size 1475248442
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc06b5cbd2ac7683e57b1ae52249f53d8b5ccf8cd27718ad72fba95231fa2073
3
+ size 1226096954
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:774612f2d4811ca7da639cec8d3b509c1f87b5ffc57761546af6466447a0619a
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9819055317e0aa1215ad120239bc4cecc175225c0dc18c98ca0bffe9f465133f
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4bece9809bf70ad158471014e9f0407932e462ce7f7864e1800e151872b48ca7
3
  size 1000
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:879c433ff59d472a2c5d7c4da04ae14ac33f2ec2552c8f49d34302050bc28fb0
3
  size 1000
last-checkpoint/tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
last-checkpoint/tokenizer_config.json CHANGED
@@ -1,6 +1,46 @@
1
  {
2
  "added_tokens_decoder": {
3
- "0": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4
  "content": "|||IP_ADDRESS|||",
5
  "lstrip": false,
6
  "normalized": true,
@@ -8,7 +48,7 @@
8
  "single_word": false,
9
  "special": false
10
  },
11
- "1": {
12
  "content": "<|padding|>",
13
  "lstrip": false,
14
  "normalized": false,
@@ -16,7 +56,7 @@
16
  "single_word": false,
17
  "special": true
18
  },
19
- "50254": {
20
  "content": " ",
21
  "lstrip": false,
22
  "normalized": true,
@@ -24,7 +64,7 @@
24
  "single_word": false,
25
  "special": false
26
  },
27
- "50255": {
28
  "content": " ",
29
  "lstrip": false,
30
  "normalized": true,
@@ -32,7 +72,7 @@
32
  "single_word": false,
33
  "special": false
34
  },
35
- "50256": {
36
  "content": " ",
37
  "lstrip": false,
38
  "normalized": true,
@@ -40,7 +80,7 @@
40
  "single_word": false,
41
  "special": false
42
  },
43
- "50257": {
44
  "content": " ",
45
  "lstrip": false,
46
  "normalized": true,
@@ -48,7 +88,7 @@
48
  "single_word": false,
49
  "special": false
50
  },
51
- "50258": {
52
  "content": " ",
53
  "lstrip": false,
54
  "normalized": true,
@@ -56,7 +96,7 @@
56
  "single_word": false,
57
  "special": false
58
  },
59
- "50259": {
60
  "content": " ",
61
  "lstrip": false,
62
  "normalized": true,
@@ -64,7 +104,7 @@
64
  "single_word": false,
65
  "special": false
66
  },
67
- "50260": {
68
  "content": " ",
69
  "lstrip": false,
70
  "normalized": true,
@@ -72,7 +112,7 @@
72
  "single_word": false,
73
  "special": false
74
  },
75
- "50261": {
76
  "content": " ",
77
  "lstrip": false,
78
  "normalized": true,
@@ -80,7 +120,7 @@
80
  "single_word": false,
81
  "special": false
82
  },
83
- "50262": {
84
  "content": " ",
85
  "lstrip": false,
86
  "normalized": true,
@@ -88,7 +128,7 @@
88
  "single_word": false,
89
  "special": false
90
  },
91
- "50263": {
92
  "content": " ",
93
  "lstrip": false,
94
  "normalized": true,
@@ -96,7 +136,7 @@
96
  "single_word": false,
97
  "special": false
98
  },
99
- "50264": {
100
  "content": " ",
101
  "lstrip": false,
102
  "normalized": true,
@@ -104,7 +144,7 @@
104
  "single_word": false,
105
  "special": false
106
  },
107
- "50265": {
108
  "content": " ",
109
  "lstrip": false,
110
  "normalized": true,
@@ -112,7 +152,7 @@
112
  "single_word": false,
113
  "special": false
114
  },
115
- "50266": {
116
  "content": " ",
117
  "lstrip": false,
118
  "normalized": true,
@@ -120,7 +160,7 @@
120
  "single_word": false,
121
  "special": false
122
  },
123
- "50267": {
124
  "content": " ",
125
  "lstrip": false,
126
  "normalized": true,
@@ -128,7 +168,7 @@
128
  "single_word": false,
129
  "special": false
130
  },
131
- "50268": {
132
  "content": " ",
133
  "lstrip": false,
134
  "normalized": true,
@@ -136,7 +176,7 @@
136
  "single_word": false,
137
  "special": false
138
  },
139
- "50269": {
140
  "content": " ",
141
  "lstrip": false,
142
  "normalized": true,
@@ -144,7 +184,7 @@
144
  "single_word": false,
145
  "special": false
146
  },
147
- "50270": {
148
  "content": " ",
149
  "lstrip": false,
150
  "normalized": true,
@@ -152,7 +192,7 @@
152
  "single_word": false,
153
  "special": false
154
  },
155
- "50271": {
156
  "content": " ",
157
  "lstrip": false,
158
  "normalized": true,
@@ -160,7 +200,7 @@
160
  "single_word": false,
161
  "special": false
162
  },
163
- "50272": {
164
  "content": " ",
165
  "lstrip": false,
166
  "normalized": true,
@@ -168,7 +208,7 @@
168
  "single_word": false,
169
  "special": false
170
  },
171
- "50273": {
172
  "content": " ",
173
  "lstrip": false,
174
  "normalized": true,
@@ -176,7 +216,7 @@
176
  "single_word": false,
177
  "special": false
178
  },
179
- "50274": {
180
  "content": " ",
181
  "lstrip": false,
182
  "normalized": true,
@@ -184,7 +224,7 @@
184
  "single_word": false,
185
  "special": false
186
  },
187
- "50275": {
188
  "content": " ",
189
  "lstrip": false,
190
  "normalized": true,
@@ -192,7 +232,7 @@
192
  "single_word": false,
193
  "special": false
194
  },
195
- "50276": {
196
  "content": " ",
197
  "lstrip": false,
198
  "normalized": true,
@@ -200,7 +240,7 @@
200
  "single_word": false,
201
  "special": false
202
  },
203
- "50277": {
204
  "content": "|||EMAIL_ADDRESS|||",
205
  "lstrip": false,
206
  "normalized": true,
@@ -208,7 +248,7 @@
208
  "single_word": false,
209
  "special": false
210
  },
211
- "50278": {
212
  "content": "|||PHONE_NUMBER|||",
213
  "lstrip": false,
214
  "normalized": true,
@@ -216,7 +256,7 @@
216
  "single_word": false,
217
  "special": false
218
  },
219
- "50279": {
220
  "content": "<|endoftext|>",
221
  "lstrip": false,
222
  "normalized": false,
@@ -224,47 +264,7 @@
224
  "single_word": false,
225
  "special": true
226
  },
227
- "50280": {
228
- "content": "[UNK]",
229
- "lstrip": false,
230
- "normalized": false,
231
- "rstrip": false,
232
- "single_word": false,
233
- "special": true
234
- },
235
- "50281": {
236
- "content": "[CLS]",
237
- "lstrip": false,
238
- "normalized": false,
239
- "rstrip": false,
240
- "single_word": false,
241
- "special": true
242
- },
243
- "50282": {
244
- "content": "[SEP]",
245
- "lstrip": false,
246
- "normalized": false,
247
- "rstrip": false,
248
- "single_word": false,
249
- "special": true
250
- },
251
- "50283": {
252
- "content": "[PAD]",
253
- "lstrip": false,
254
- "normalized": false,
255
- "rstrip": false,
256
- "single_word": false,
257
- "special": true
258
- },
259
- "50284": {
260
- "content": "[MASK]",
261
- "lstrip": true,
262
- "normalized": false,
263
- "rstrip": false,
264
- "single_word": false,
265
- "special": true
266
- },
267
- "95580": {
268
  "content": "[unused0]",
269
  "lstrip": false,
270
  "normalized": true,
@@ -272,7 +272,7 @@
272
  "single_word": false,
273
  "special": false
274
  },
275
- "95581": {
276
  "content": "[unused1]",
277
  "lstrip": false,
278
  "normalized": true,
@@ -280,7 +280,7 @@
280
  "single_word": false,
281
  "special": false
282
  },
283
- "95582": {
284
  "content": "[unused2]",
285
  "lstrip": false,
286
  "normalized": true,
@@ -288,7 +288,7 @@
288
  "single_word": false,
289
  "special": false
290
  },
291
- "95583": {
292
  "content": "[unused3]",
293
  "lstrip": false,
294
  "normalized": true,
@@ -296,7 +296,7 @@
296
  "single_word": false,
297
  "special": false
298
  },
299
- "95584": {
300
  "content": "[unused4]",
301
  "lstrip": false,
302
  "normalized": true,
@@ -304,7 +304,7 @@
304
  "single_word": false,
305
  "special": false
306
  },
307
- "95585": {
308
  "content": "[unused5]",
309
  "lstrip": false,
310
  "normalized": true,
@@ -312,7 +312,7 @@
312
  "single_word": false,
313
  "special": false
314
  },
315
- "95586": {
316
  "content": "[unused6]",
317
  "lstrip": false,
318
  "normalized": true,
@@ -320,7 +320,7 @@
320
  "single_word": false,
321
  "special": false
322
  },
323
- "95587": {
324
  "content": "[unused7]",
325
  "lstrip": false,
326
  "normalized": true,
@@ -328,7 +328,7 @@
328
  "single_word": false,
329
  "special": false
330
  },
331
- "95588": {
332
  "content": "[unused8]",
333
  "lstrip": false,
334
  "normalized": true,
@@ -336,7 +336,7 @@
336
  "single_word": false,
337
  "special": false
338
  },
339
- "95589": {
340
  "content": "[unused9]",
341
  "lstrip": false,
342
  "normalized": true,
@@ -344,7 +344,7 @@
344
  "single_word": false,
345
  "special": false
346
  },
347
- "95590": {
348
  "content": "[unused10]",
349
  "lstrip": false,
350
  "normalized": true,
@@ -352,7 +352,7 @@
352
  "single_word": false,
353
  "special": false
354
  },
355
- "95591": {
356
  "content": "[unused11]",
357
  "lstrip": false,
358
  "normalized": true,
@@ -360,7 +360,7 @@
360
  "single_word": false,
361
  "special": false
362
  },
363
- "95592": {
364
  "content": "[unused12]",
365
  "lstrip": false,
366
  "normalized": true,
@@ -368,7 +368,7 @@
368
  "single_word": false,
369
  "special": false
370
  },
371
- "95593": {
372
  "content": "[unused13]",
373
  "lstrip": false,
374
  "normalized": true,
@@ -376,7 +376,7 @@
376
  "single_word": false,
377
  "special": false
378
  },
379
- "95594": {
380
  "content": "[unused14]",
381
  "lstrip": false,
382
  "normalized": true,
@@ -384,7 +384,7 @@
384
  "single_word": false,
385
  "special": false
386
  },
387
- "95595": {
388
  "content": "[unused15]",
389
  "lstrip": false,
390
  "normalized": true,
@@ -392,7 +392,7 @@
392
  "single_word": false,
393
  "special": false
394
  },
395
- "95596": {
396
  "content": "[unused16]",
397
  "lstrip": false,
398
  "normalized": true,
@@ -400,7 +400,7 @@
400
  "single_word": false,
401
  "special": false
402
  },
403
- "95597": {
404
  "content": "[unused17]",
405
  "lstrip": false,
406
  "normalized": true,
@@ -408,7 +408,7 @@
408
  "single_word": false,
409
  "special": false
410
  },
411
- "95598": {
412
  "content": "[unused18]",
413
  "lstrip": false,
414
  "normalized": true,
@@ -416,7 +416,7 @@
416
  "single_word": false,
417
  "special": false
418
  },
419
- "95599": {
420
  "content": "[unused19]",
421
  "lstrip": false,
422
  "normalized": true,
@@ -424,7 +424,7 @@
424
  "single_word": false,
425
  "special": false
426
  },
427
- "95600": {
428
  "content": "[unused20]",
429
  "lstrip": false,
430
  "normalized": true,
@@ -432,7 +432,7 @@
432
  "single_word": false,
433
  "special": false
434
  },
435
- "95601": {
436
  "content": "[unused21]",
437
  "lstrip": false,
438
  "normalized": true,
@@ -440,7 +440,7 @@
440
  "single_word": false,
441
  "special": false
442
  },
443
- "95602": {
444
  "content": "[unused22]",
445
  "lstrip": false,
446
  "normalized": true,
@@ -448,7 +448,7 @@
448
  "single_word": false,
449
  "special": false
450
  },
451
- "95603": {
452
  "content": "[unused23]",
453
  "lstrip": false,
454
  "normalized": true,
@@ -456,7 +456,7 @@
456
  "single_word": false,
457
  "special": false
458
  },
459
- "95604": {
460
  "content": "[unused24]",
461
  "lstrip": false,
462
  "normalized": true,
@@ -464,7 +464,7 @@
464
  "single_word": false,
465
  "special": false
466
  },
467
- "95605": {
468
  "content": "[unused25]",
469
  "lstrip": false,
470
  "normalized": true,
@@ -472,7 +472,7 @@
472
  "single_word": false,
473
  "special": false
474
  },
475
- "95606": {
476
  "content": "[unused26]",
477
  "lstrip": false,
478
  "normalized": true,
@@ -480,7 +480,7 @@
480
  "single_word": false,
481
  "special": false
482
  },
483
- "95607": {
484
  "content": "[unused27]",
485
  "lstrip": false,
486
  "normalized": true,
@@ -488,7 +488,7 @@
488
  "single_word": false,
489
  "special": false
490
  },
491
- "95608": {
492
  "content": "[unused28]",
493
  "lstrip": false,
494
  "normalized": true,
@@ -496,7 +496,7 @@
496
  "single_word": false,
497
  "special": false
498
  },
499
- "95609": {
500
  "content": "[unused29]",
501
  "lstrip": false,
502
  "normalized": true,
@@ -504,7 +504,7 @@
504
  "single_word": false,
505
  "special": false
506
  },
507
- "95610": {
508
  "content": "[unused30]",
509
  "lstrip": false,
510
  "normalized": true,
@@ -512,7 +512,7 @@
512
  "single_word": false,
513
  "special": false
514
  },
515
- "95611": {
516
  "content": "[unused31]",
517
  "lstrip": false,
518
  "normalized": true,
@@ -520,7 +520,7 @@
520
  "single_word": false,
521
  "special": false
522
  },
523
- "95612": {
524
  "content": "[unused32]",
525
  "lstrip": false,
526
  "normalized": true,
@@ -528,7 +528,7 @@
528
  "single_word": false,
529
  "special": false
530
  },
531
- "95613": {
532
  "content": "[unused33]",
533
  "lstrip": false,
534
  "normalized": true,
@@ -536,7 +536,7 @@
536
  "single_word": false,
537
  "special": false
538
  },
539
- "95614": {
540
  "content": "[unused34]",
541
  "lstrip": false,
542
  "normalized": true,
@@ -544,7 +544,7 @@
544
  "single_word": false,
545
  "special": false
546
  },
547
- "95615": {
548
  "content": "[unused35]",
549
  "lstrip": false,
550
  "normalized": true,
@@ -552,7 +552,7 @@
552
  "single_word": false,
553
  "special": false
554
  },
555
- "95616": {
556
  "content": "[unused36]",
557
  "lstrip": false,
558
  "normalized": true,
@@ -560,7 +560,7 @@
560
  "single_word": false,
561
  "special": false
562
  },
563
- "95617": {
564
  "content": "[unused37]",
565
  "lstrip": false,
566
  "normalized": true,
@@ -568,7 +568,7 @@
568
  "single_word": false,
569
  "special": false
570
  },
571
- "95618": {
572
  "content": "[unused38]",
573
  "lstrip": false,
574
  "normalized": true,
@@ -576,7 +576,7 @@
576
  "single_word": false,
577
  "special": false
578
  },
579
- "95619": {
580
  "content": "[unused39]",
581
  "lstrip": false,
582
  "normalized": true,
@@ -584,7 +584,7 @@
584
  "single_word": false,
585
  "special": false
586
  },
587
- "95620": {
588
  "content": "[unused40]",
589
  "lstrip": false,
590
  "normalized": true,
@@ -592,7 +592,7 @@
592
  "single_word": false,
593
  "special": false
594
  },
595
- "95621": {
596
  "content": "[unused41]",
597
  "lstrip": false,
598
  "normalized": true,
@@ -600,7 +600,7 @@
600
  "single_word": false,
601
  "special": false
602
  },
603
- "95622": {
604
  "content": "[unused42]",
605
  "lstrip": false,
606
  "normalized": true,
@@ -608,7 +608,7 @@
608
  "single_word": false,
609
  "special": false
610
  },
611
- "95623": {
612
  "content": "[unused43]",
613
  "lstrip": false,
614
  "normalized": true,
@@ -616,7 +616,7 @@
616
  "single_word": false,
617
  "special": false
618
  },
619
- "95624": {
620
  "content": "[unused44]",
621
  "lstrip": false,
622
  "normalized": true,
@@ -624,7 +624,7 @@
624
  "single_word": false,
625
  "special": false
626
  },
627
- "95625": {
628
  "content": "[unused45]",
629
  "lstrip": false,
630
  "normalized": true,
@@ -632,7 +632,7 @@
632
  "single_word": false,
633
  "special": false
634
  },
635
- "95626": {
636
  "content": "[unused46]",
637
  "lstrip": false,
638
  "normalized": true,
@@ -640,7 +640,7 @@
640
  "single_word": false,
641
  "special": false
642
  },
643
- "95627": {
644
  "content": "[unused47]",
645
  "lstrip": false,
646
  "normalized": true,
@@ -648,7 +648,7 @@
648
  "single_word": false,
649
  "special": false
650
  },
651
- "95628": {
652
  "content": "[unused48]",
653
  "lstrip": false,
654
  "normalized": true,
@@ -656,7 +656,7 @@
656
  "single_word": false,
657
  "special": false
658
  },
659
- "95629": {
660
  "content": "[unused49]",
661
  "lstrip": false,
662
  "normalized": true,
@@ -664,7 +664,7 @@
664
  "single_word": false,
665
  "special": false
666
  },
667
- "95630": {
668
  "content": "[unused50]",
669
  "lstrip": false,
670
  "normalized": true,
@@ -672,7 +672,7 @@
672
  "single_word": false,
673
  "special": false
674
  },
675
- "95631": {
676
  "content": "[unused51]",
677
  "lstrip": false,
678
  "normalized": true,
@@ -680,7 +680,7 @@
680
  "single_word": false,
681
  "special": false
682
  },
683
- "95632": {
684
  "content": "[unused52]",
685
  "lstrip": false,
686
  "normalized": true,
@@ -688,7 +688,7 @@
688
  "single_word": false,
689
  "special": false
690
  },
691
- "95633": {
692
  "content": "[unused53]",
693
  "lstrip": false,
694
  "normalized": true,
@@ -696,7 +696,7 @@
696
  "single_word": false,
697
  "special": false
698
  },
699
- "95634": {
700
  "content": "[unused54]",
701
  "lstrip": false,
702
  "normalized": true,
@@ -704,7 +704,7 @@
704
  "single_word": false,
705
  "special": false
706
  },
707
- "95635": {
708
  "content": "[unused55]",
709
  "lstrip": false,
710
  "normalized": true,
@@ -712,7 +712,7 @@
712
  "single_word": false,
713
  "special": false
714
  },
715
- "95636": {
716
  "content": "[unused56]",
717
  "lstrip": false,
718
  "normalized": true,
@@ -720,7 +720,7 @@
720
  "single_word": false,
721
  "special": false
722
  },
723
- "95637": {
724
  "content": "[unused57]",
725
  "lstrip": false,
726
  "normalized": true,
@@ -728,7 +728,7 @@
728
  "single_word": false,
729
  "special": false
730
  },
731
- "95638": {
732
  "content": "[unused58]",
733
  "lstrip": false,
734
  "normalized": true,
@@ -736,7 +736,7 @@
736
  "single_word": false,
737
  "special": false
738
  },
739
- "95639": {
740
  "content": "[unused59]",
741
  "lstrip": false,
742
  "normalized": true,
@@ -744,7 +744,7 @@
744
  "single_word": false,
745
  "special": false
746
  },
747
- "95640": {
748
  "content": "[unused60]",
749
  "lstrip": false,
750
  "normalized": true,
@@ -752,7 +752,7 @@
752
  "single_word": false,
753
  "special": false
754
  },
755
- "95641": {
756
  "content": "[unused61]",
757
  "lstrip": false,
758
  "normalized": true,
@@ -760,7 +760,7 @@
760
  "single_word": false,
761
  "special": false
762
  },
763
- "95642": {
764
  "content": "[unused62]",
765
  "lstrip": false,
766
  "normalized": true,
@@ -768,7 +768,7 @@
768
  "single_word": false,
769
  "special": false
770
  },
771
- "95643": {
772
  "content": "[unused63]",
773
  "lstrip": false,
774
  "normalized": true,
@@ -776,7 +776,7 @@
776
  "single_word": false,
777
  "special": false
778
  },
779
- "95644": {
780
  "content": "[unused64]",
781
  "lstrip": false,
782
  "normalized": true,
@@ -784,7 +784,7 @@
784
  "single_word": false,
785
  "special": false
786
  },
787
- "95645": {
788
  "content": "[unused65]",
789
  "lstrip": false,
790
  "normalized": true,
@@ -792,7 +792,7 @@
792
  "single_word": false,
793
  "special": false
794
  },
795
- "95646": {
796
  "content": "[unused66]",
797
  "lstrip": false,
798
  "normalized": true,
@@ -800,7 +800,7 @@
800
  "single_word": false,
801
  "special": false
802
  },
803
- "95647": {
804
  "content": "[unused67]",
805
  "lstrip": false,
806
  "normalized": true,
@@ -808,7 +808,7 @@
808
  "single_word": false,
809
  "special": false
810
  },
811
- "95648": {
812
  "content": "[unused68]",
813
  "lstrip": false,
814
  "normalized": true,
@@ -816,7 +816,7 @@
816
  "single_word": false,
817
  "special": false
818
  },
819
- "95649": {
820
  "content": "[unused69]",
821
  "lstrip": false,
822
  "normalized": true,
@@ -824,7 +824,7 @@
824
  "single_word": false,
825
  "special": false
826
  },
827
- "95650": {
828
  "content": "[unused70]",
829
  "lstrip": false,
830
  "normalized": true,
@@ -832,7 +832,7 @@
832
  "single_word": false,
833
  "special": false
834
  },
835
- "95651": {
836
  "content": "[unused71]",
837
  "lstrip": false,
838
  "normalized": true,
@@ -840,7 +840,7 @@
840
  "single_word": false,
841
  "special": false
842
  },
843
- "95652": {
844
  "content": "[unused72]",
845
  "lstrip": false,
846
  "normalized": true,
@@ -848,7 +848,7 @@
848
  "single_word": false,
849
  "special": false
850
  },
851
- "95653": {
852
  "content": "[unused73]",
853
  "lstrip": false,
854
  "normalized": true,
@@ -856,7 +856,7 @@
856
  "single_word": false,
857
  "special": false
858
  },
859
- "95654": {
860
  "content": "[unused74]",
861
  "lstrip": false,
862
  "normalized": true,
@@ -864,7 +864,7 @@
864
  "single_word": false,
865
  "special": false
866
  },
867
- "95655": {
868
  "content": "[unused75]",
869
  "lstrip": false,
870
  "normalized": true,
@@ -872,7 +872,7 @@
872
  "single_word": false,
873
  "special": false
874
  },
875
- "95656": {
876
  "content": "[unused76]",
877
  "lstrip": false,
878
  "normalized": true,
@@ -880,7 +880,7 @@
880
  "single_word": false,
881
  "special": false
882
  },
883
- "95657": {
884
  "content": "[unused77]",
885
  "lstrip": false,
886
  "normalized": true,
@@ -888,7 +888,7 @@
888
  "single_word": false,
889
  "special": false
890
  },
891
- "95658": {
892
  "content": "[unused78]",
893
  "lstrip": false,
894
  "normalized": true,
@@ -896,7 +896,7 @@
896
  "single_word": false,
897
  "special": false
898
  },
899
- "95659": {
900
  "content": "[unused79]",
901
  "lstrip": false,
902
  "normalized": true,
@@ -904,7 +904,7 @@
904
  "single_word": false,
905
  "special": false
906
  },
907
- "95660": {
908
  "content": "[unused80]",
909
  "lstrip": false,
910
  "normalized": true,
@@ -912,7 +912,7 @@
912
  "single_word": false,
913
  "special": false
914
  },
915
- "95661": {
916
  "content": "[unused81]",
917
  "lstrip": false,
918
  "normalized": true,
@@ -920,7 +920,7 @@
920
  "single_word": false,
921
  "special": false
922
  },
923
- "95662": {
924
  "content": "[unused82]",
925
  "lstrip": false,
926
  "normalized": true,
@@ -937,7 +937,7 @@
937
  "input_ids",
938
  "attention_mask"
939
  ],
940
- "model_max_length": 1000000000000000019884624838656,
941
  "pad_token": "[PAD]",
942
  "sep_token": "[SEP]",
943
  "tokenizer_class": "PreTrainedTokenizerFast",
 
1
  {
2
  "added_tokens_decoder": {
3
+ "50280": {
4
+ "content": "[UNK]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "50281": {
12
+ "content": "[CLS]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "50282": {
20
+ "content": "[SEP]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "50283": {
28
+ "content": "[PAD]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "50284": {
36
+ "content": "[MASK]",
37
+ "lstrip": true,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ },
43
+ "55000": {
44
  "content": "|||IP_ADDRESS|||",
45
  "lstrip": false,
46
  "normalized": true,
 
48
  "single_word": false,
49
  "special": false
50
  },
51
+ "55001": {
52
  "content": "<|padding|>",
53
  "lstrip": false,
54
  "normalized": false,
 
56
  "single_word": false,
57
  "special": true
58
  },
59
+ "55002": {
60
  "content": " ",
61
  "lstrip": false,
62
  "normalized": true,
 
64
  "single_word": false,
65
  "special": false
66
  },
67
+ "55003": {
68
  "content": " ",
69
  "lstrip": false,
70
  "normalized": true,
 
72
  "single_word": false,
73
  "special": false
74
  },
75
+ "55004": {
76
  "content": " ",
77
  "lstrip": false,
78
  "normalized": true,
 
80
  "single_word": false,
81
  "special": false
82
  },
83
+ "55005": {
84
  "content": " ",
85
  "lstrip": false,
86
  "normalized": true,
 
88
  "single_word": false,
89
  "special": false
90
  },
91
+ "55006": {
92
  "content": " ",
93
  "lstrip": false,
94
  "normalized": true,
 
96
  "single_word": false,
97
  "special": false
98
  },
99
+ "55007": {
100
  "content": " ",
101
  "lstrip": false,
102
  "normalized": true,
 
104
  "single_word": false,
105
  "special": false
106
  },
107
+ "55008": {
108
  "content": " ",
109
  "lstrip": false,
110
  "normalized": true,
 
112
  "single_word": false,
113
  "special": false
114
  },
115
+ "55009": {
116
  "content": " ",
117
  "lstrip": false,
118
  "normalized": true,
 
120
  "single_word": false,
121
  "special": false
122
  },
123
+ "55010": {
124
  "content": " ",
125
  "lstrip": false,
126
  "normalized": true,
 
128
  "single_word": false,
129
  "special": false
130
  },
131
+ "55011": {
132
  "content": " ",
133
  "lstrip": false,
134
  "normalized": true,
 
136
  "single_word": false,
137
  "special": false
138
  },
139
+ "55012": {
140
  "content": " ",
141
  "lstrip": false,
142
  "normalized": true,
 
144
  "single_word": false,
145
  "special": false
146
  },
147
+ "55013": {
148
  "content": " ",
149
  "lstrip": false,
150
  "normalized": true,
 
152
  "single_word": false,
153
  "special": false
154
  },
155
+ "55014": {
156
  "content": " ",
157
  "lstrip": false,
158
  "normalized": true,
 
160
  "single_word": false,
161
  "special": false
162
  },
163
+ "55015": {
164
  "content": " ",
165
  "lstrip": false,
166
  "normalized": true,
 
168
  "single_word": false,
169
  "special": false
170
  },
171
+ "55016": {
172
  "content": " ",
173
  "lstrip": false,
174
  "normalized": true,
 
176
  "single_word": false,
177
  "special": false
178
  },
179
+ "55017": {
180
  "content": " ",
181
  "lstrip": false,
182
  "normalized": true,
 
184
  "single_word": false,
185
  "special": false
186
  },
187
+ "55018": {
188
  "content": " ",
189
  "lstrip": false,
190
  "normalized": true,
 
192
  "single_word": false,
193
  "special": false
194
  },
195
+ "55019": {
196
  "content": " ",
197
  "lstrip": false,
198
  "normalized": true,
 
200
  "single_word": false,
201
  "special": false
202
  },
203
+ "55020": {
204
  "content": " ",
205
  "lstrip": false,
206
  "normalized": true,
 
208
  "single_word": false,
209
  "special": false
210
  },
211
+ "55021": {
212
  "content": " ",
213
  "lstrip": false,
214
  "normalized": true,
 
216
  "single_word": false,
217
  "special": false
218
  },
219
+ "55022": {
220
  "content": " ",
221
  "lstrip": false,
222
  "normalized": true,
 
224
  "single_word": false,
225
  "special": false
226
  },
227
+ "55023": {
228
  "content": " ",
229
  "lstrip": false,
230
  "normalized": true,
 
232
  "single_word": false,
233
  "special": false
234
  },
235
+ "55024": {
236
  "content": " ",
237
  "lstrip": false,
238
  "normalized": true,
 
240
  "single_word": false,
241
  "special": false
242
  },
243
+ "55025": {
244
  "content": "|||EMAIL_ADDRESS|||",
245
  "lstrip": false,
246
  "normalized": true,
 
248
  "single_word": false,
249
  "special": false
250
  },
251
+ "55026": {
252
  "content": "|||PHONE_NUMBER|||",
253
  "lstrip": false,
254
  "normalized": true,
 
256
  "single_word": false,
257
  "special": false
258
  },
259
+ "55027": {
260
  "content": "<|endoftext|>",
261
  "lstrip": false,
262
  "normalized": false,
 
264
  "single_word": false,
265
  "special": true
266
  },
267
+ "55028": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
268
  "content": "[unused0]",
269
  "lstrip": false,
270
  "normalized": true,
 
272
  "single_word": false,
273
  "special": false
274
  },
275
+ "55029": {
276
  "content": "[unused1]",
277
  "lstrip": false,
278
  "normalized": true,
 
280
  "single_word": false,
281
  "special": false
282
  },
283
+ "55030": {
284
  "content": "[unused2]",
285
  "lstrip": false,
286
  "normalized": true,
 
288
  "single_word": false,
289
  "special": false
290
  },
291
+ "55031": {
292
  "content": "[unused3]",
293
  "lstrip": false,
294
  "normalized": true,
 
296
  "single_word": false,
297
  "special": false
298
  },
299
+ "55032": {
300
  "content": "[unused4]",
301
  "lstrip": false,
302
  "normalized": true,
 
304
  "single_word": false,
305
  "special": false
306
  },
307
+ "55033": {
308
  "content": "[unused5]",
309
  "lstrip": false,
310
  "normalized": true,
 
312
  "single_word": false,
313
  "special": false
314
  },
315
+ "55034": {
316
  "content": "[unused6]",
317
  "lstrip": false,
318
  "normalized": true,
 
320
  "single_word": false,
321
  "special": false
322
  },
323
+ "55035": {
324
  "content": "[unused7]",
325
  "lstrip": false,
326
  "normalized": true,
 
328
  "single_word": false,
329
  "special": false
330
  },
331
+ "55036": {
332
  "content": "[unused8]",
333
  "lstrip": false,
334
  "normalized": true,
 
336
  "single_word": false,
337
  "special": false
338
  },
339
+ "55037": {
340
  "content": "[unused9]",
341
  "lstrip": false,
342
  "normalized": true,
 
344
  "single_word": false,
345
  "special": false
346
  },
347
+ "55038": {
348
  "content": "[unused10]",
349
  "lstrip": false,
350
  "normalized": true,
 
352
  "single_word": false,
353
  "special": false
354
  },
355
+ "55039": {
356
  "content": "[unused11]",
357
  "lstrip": false,
358
  "normalized": true,
 
360
  "single_word": false,
361
  "special": false
362
  },
363
+ "55040": {
364
  "content": "[unused12]",
365
  "lstrip": false,
366
  "normalized": true,
 
368
  "single_word": false,
369
  "special": false
370
  },
371
+ "55041": {
372
  "content": "[unused13]",
373
  "lstrip": false,
374
  "normalized": true,
 
376
  "single_word": false,
377
  "special": false
378
  },
379
+ "55042": {
380
  "content": "[unused14]",
381
  "lstrip": false,
382
  "normalized": true,
 
384
  "single_word": false,
385
  "special": false
386
  },
387
+ "55043": {
388
  "content": "[unused15]",
389
  "lstrip": false,
390
  "normalized": true,
 
392
  "single_word": false,
393
  "special": false
394
  },
395
+ "55044": {
396
  "content": "[unused16]",
397
  "lstrip": false,
398
  "normalized": true,
 
400
  "single_word": false,
401
  "special": false
402
  },
403
+ "55045": {
404
  "content": "[unused17]",
405
  "lstrip": false,
406
  "normalized": true,
 
408
  "single_word": false,
409
  "special": false
410
  },
411
+ "55046": {
412
  "content": "[unused18]",
413
  "lstrip": false,
414
  "normalized": true,
 
416
  "single_word": false,
417
  "special": false
418
  },
419
+ "55047": {
420
  "content": "[unused19]",
421
  "lstrip": false,
422
  "normalized": true,
 
424
  "single_word": false,
425
  "special": false
426
  },
427
+ "55048": {
428
  "content": "[unused20]",
429
  "lstrip": false,
430
  "normalized": true,
 
432
  "single_word": false,
433
  "special": false
434
  },
435
+ "55049": {
436
  "content": "[unused21]",
437
  "lstrip": false,
438
  "normalized": true,
 
440
  "single_word": false,
441
  "special": false
442
  },
443
+ "55050": {
444
  "content": "[unused22]",
445
  "lstrip": false,
446
  "normalized": true,
 
448
  "single_word": false,
449
  "special": false
450
  },
451
+ "55051": {
452
  "content": "[unused23]",
453
  "lstrip": false,
454
  "normalized": true,
 
456
  "single_word": false,
457
  "special": false
458
  },
459
+ "55052": {
460
  "content": "[unused24]",
461
  "lstrip": false,
462
  "normalized": true,
 
464
  "single_word": false,
465
  "special": false
466
  },
467
+ "55053": {
468
  "content": "[unused25]",
469
  "lstrip": false,
470
  "normalized": true,
 
472
  "single_word": false,
473
  "special": false
474
  },
475
+ "55054": {
476
  "content": "[unused26]",
477
  "lstrip": false,
478
  "normalized": true,
 
480
  "single_word": false,
481
  "special": false
482
  },
483
+ "55055": {
484
  "content": "[unused27]",
485
  "lstrip": false,
486
  "normalized": true,
 
488
  "single_word": false,
489
  "special": false
490
  },
491
+ "55056": {
492
  "content": "[unused28]",
493
  "lstrip": false,
494
  "normalized": true,
 
496
  "single_word": false,
497
  "special": false
498
  },
499
+ "55057": {
500
  "content": "[unused29]",
501
  "lstrip": false,
502
  "normalized": true,
 
504
  "single_word": false,
505
  "special": false
506
  },
507
+ "55058": {
508
  "content": "[unused30]",
509
  "lstrip": false,
510
  "normalized": true,
 
512
  "single_word": false,
513
  "special": false
514
  },
515
+ "55059": {
516
  "content": "[unused31]",
517
  "lstrip": false,
518
  "normalized": true,
 
520
  "single_word": false,
521
  "special": false
522
  },
523
+ "55060": {
524
  "content": "[unused32]",
525
  "lstrip": false,
526
  "normalized": true,
 
528
  "single_word": false,
529
  "special": false
530
  },
531
+ "55061": {
532
  "content": "[unused33]",
533
  "lstrip": false,
534
  "normalized": true,
 
536
  "single_word": false,
537
  "special": false
538
  },
539
+ "55062": {
540
  "content": "[unused34]",
541
  "lstrip": false,
542
  "normalized": true,
 
544
  "single_word": false,
545
  "special": false
546
  },
547
+ "55063": {
548
  "content": "[unused35]",
549
  "lstrip": false,
550
  "normalized": true,
 
552
  "single_word": false,
553
  "special": false
554
  },
555
+ "55064": {
556
  "content": "[unused36]",
557
  "lstrip": false,
558
  "normalized": true,
 
560
  "single_word": false,
561
  "special": false
562
  },
563
+ "55065": {
564
  "content": "[unused37]",
565
  "lstrip": false,
566
  "normalized": true,
 
568
  "single_word": false,
569
  "special": false
570
  },
571
+ "55066": {
572
  "content": "[unused38]",
573
  "lstrip": false,
574
  "normalized": true,
 
576
  "single_word": false,
577
  "special": false
578
  },
579
+ "55067": {
580
  "content": "[unused39]",
581
  "lstrip": false,
582
  "normalized": true,
 
584
  "single_word": false,
585
  "special": false
586
  },
587
+ "55068": {
588
  "content": "[unused40]",
589
  "lstrip": false,
590
  "normalized": true,
 
592
  "single_word": false,
593
  "special": false
594
  },
595
+ "55069": {
596
  "content": "[unused41]",
597
  "lstrip": false,
598
  "normalized": true,
 
600
  "single_word": false,
601
  "special": false
602
  },
603
+ "55070": {
604
  "content": "[unused42]",
605
  "lstrip": false,
606
  "normalized": true,
 
608
  "single_word": false,
609
  "special": false
610
  },
611
+ "55071": {
612
  "content": "[unused43]",
613
  "lstrip": false,
614
  "normalized": true,
 
616
  "single_word": false,
617
  "special": false
618
  },
619
+ "55072": {
620
  "content": "[unused44]",
621
  "lstrip": false,
622
  "normalized": true,
 
624
  "single_word": false,
625
  "special": false
626
  },
627
+ "55073": {
628
  "content": "[unused45]",
629
  "lstrip": false,
630
  "normalized": true,
 
632
  "single_word": false,
633
  "special": false
634
  },
635
+ "55074": {
636
  "content": "[unused46]",
637
  "lstrip": false,
638
  "normalized": true,
 
640
  "single_word": false,
641
  "special": false
642
  },
643
+ "55075": {
644
  "content": "[unused47]",
645
  "lstrip": false,
646
  "normalized": true,
 
648
  "single_word": false,
649
  "special": false
650
  },
651
+ "55076": {
652
  "content": "[unused48]",
653
  "lstrip": false,
654
  "normalized": true,
 
656
  "single_word": false,
657
  "special": false
658
  },
659
+ "55077": {
660
  "content": "[unused49]",
661
  "lstrip": false,
662
  "normalized": true,
 
664
  "single_word": false,
665
  "special": false
666
  },
667
+ "55078": {
668
  "content": "[unused50]",
669
  "lstrip": false,
670
  "normalized": true,
 
672
  "single_word": false,
673
  "special": false
674
  },
675
+ "55079": {
676
  "content": "[unused51]",
677
  "lstrip": false,
678
  "normalized": true,
 
680
  "single_word": false,
681
  "special": false
682
  },
683
+ "55080": {
684
  "content": "[unused52]",
685
  "lstrip": false,
686
  "normalized": true,
 
688
  "single_word": false,
689
  "special": false
690
  },
691
+ "55081": {
692
  "content": "[unused53]",
693
  "lstrip": false,
694
  "normalized": true,
 
696
  "single_word": false,
697
  "special": false
698
  },
699
+ "55082": {
700
  "content": "[unused54]",
701
  "lstrip": false,
702
  "normalized": true,
 
704
  "single_word": false,
705
  "special": false
706
  },
707
+ "55083": {
708
  "content": "[unused55]",
709
  "lstrip": false,
710
  "normalized": true,
 
712
  "single_word": false,
713
  "special": false
714
  },
715
+ "55084": {
716
  "content": "[unused56]",
717
  "lstrip": false,
718
  "normalized": true,
 
720
  "single_word": false,
721
  "special": false
722
  },
723
+ "55085": {
724
  "content": "[unused57]",
725
  "lstrip": false,
726
  "normalized": true,
 
728
  "single_word": false,
729
  "special": false
730
  },
731
+ "55086": {
732
  "content": "[unused58]",
733
  "lstrip": false,
734
  "normalized": true,
 
736
  "single_word": false,
737
  "special": false
738
  },
739
+ "55087": {
740
  "content": "[unused59]",
741
  "lstrip": false,
742
  "normalized": true,
 
744
  "single_word": false,
745
  "special": false
746
  },
747
+ "55088": {
748
  "content": "[unused60]",
749
  "lstrip": false,
750
  "normalized": true,
 
752
  "single_word": false,
753
  "special": false
754
  },
755
+ "55089": {
756
  "content": "[unused61]",
757
  "lstrip": false,
758
  "normalized": true,
 
760
  "single_word": false,
761
  "special": false
762
  },
763
+ "55090": {
764
  "content": "[unused62]",
765
  "lstrip": false,
766
  "normalized": true,
 
768
  "single_word": false,
769
  "special": false
770
  },
771
+ "55091": {
772
  "content": "[unused63]",
773
  "lstrip": false,
774
  "normalized": true,
 
776
  "single_word": false,
777
  "special": false
778
  },
779
+ "55092": {
780
  "content": "[unused64]",
781
  "lstrip": false,
782
  "normalized": true,
 
784
  "single_word": false,
785
  "special": false
786
  },
787
+ "55093": {
788
  "content": "[unused65]",
789
  "lstrip": false,
790
  "normalized": true,
 
792
  "single_word": false,
793
  "special": false
794
  },
795
+ "55094": {
796
  "content": "[unused66]",
797
  "lstrip": false,
798
  "normalized": true,
 
800
  "single_word": false,
801
  "special": false
802
  },
803
+ "55095": {
804
  "content": "[unused67]",
805
  "lstrip": false,
806
  "normalized": true,
 
808
  "single_word": false,
809
  "special": false
810
  },
811
+ "55096": {
812
  "content": "[unused68]",
813
  "lstrip": false,
814
  "normalized": true,
 
816
  "single_word": false,
817
  "special": false
818
  },
819
+ "55097": {
820
  "content": "[unused69]",
821
  "lstrip": false,
822
  "normalized": true,
 
824
  "single_word": false,
825
  "special": false
826
  },
827
+ "55098": {
828
  "content": "[unused70]",
829
  "lstrip": false,
830
  "normalized": true,
 
832
  "single_word": false,
833
  "special": false
834
  },
835
+ "55099": {
836
  "content": "[unused71]",
837
  "lstrip": false,
838
  "normalized": true,
 
840
  "single_word": false,
841
  "special": false
842
  },
843
+ "55100": {
844
  "content": "[unused72]",
845
  "lstrip": false,
846
  "normalized": true,
 
848
  "single_word": false,
849
  "special": false
850
  },
851
+ "55101": {
852
  "content": "[unused73]",
853
  "lstrip": false,
854
  "normalized": true,
 
856
  "single_word": false,
857
  "special": false
858
  },
859
+ "55102": {
860
  "content": "[unused74]",
861
  "lstrip": false,
862
  "normalized": true,
 
864
  "single_word": false,
865
  "special": false
866
  },
867
+ "55103": {
868
  "content": "[unused75]",
869
  "lstrip": false,
870
  "normalized": true,
 
872
  "single_word": false,
873
  "special": false
874
  },
875
+ "55104": {
876
  "content": "[unused76]",
877
  "lstrip": false,
878
  "normalized": true,
 
880
  "single_word": false,
881
  "special": false
882
  },
883
+ "55105": {
884
  "content": "[unused77]",
885
  "lstrip": false,
886
  "normalized": true,
 
888
  "single_word": false,
889
  "special": false
890
  },
891
+ "55106": {
892
  "content": "[unused78]",
893
  "lstrip": false,
894
  "normalized": true,
 
896
  "single_word": false,
897
  "special": false
898
  },
899
+ "55107": {
900
  "content": "[unused79]",
901
  "lstrip": false,
902
  "normalized": true,
 
904
  "single_word": false,
905
  "special": false
906
  },
907
+ "55108": {
908
  "content": "[unused80]",
909
  "lstrip": false,
910
  "normalized": true,
 
912
  "single_word": false,
913
  "special": false
914
  },
915
+ "55109": {
916
  "content": "[unused81]",
917
  "lstrip": false,
918
  "normalized": true,
 
920
  "single_word": false,
921
  "special": false
922
  },
923
+ "55110": {
924
  "content": "[unused82]",
925
  "lstrip": false,
926
  "normalized": true,
 
937
  "input_ids",
938
  "attention_mask"
939
  ],
940
+ "model_max_length": 8192,
941
  "pad_token": "[PAD]",
942
  "sep_token": "[SEP]",
943
  "tokenizer_class": "PreTrainedTokenizerFast",
last-checkpoint/trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff