mosesdaudu committed on
Commit
2c56376
·
verified ·
1 Parent(s): 6bc9010

Training in progress, step 100

Browse files
adapter_config.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": null,
4
+ "base_model_name_or_path": "DAMO-NLP-MT/polylm-1.7b",
5
+ "bias": "none",
6
+ "fan_in_fan_out": false,
7
+ "inference_mode": true,
8
+ "init_lora_weights": true,
9
+ "layers_pattern": null,
10
+ "layers_to_transform": null,
11
+ "loftq_config": {},
12
+ "lora_alpha": 16,
13
+ "lora_dropout": 0.1,
14
+ "megatron_config": null,
15
+ "megatron_core": "megatron.core",
16
+ "modules_to_save": null,
17
+ "peft_type": "LORA",
18
+ "r": 4,
19
+ "rank_pattern": {},
20
+ "revision": null,
21
+ "target_modules": [
22
+ "c_attn"
23
+ ],
24
+ "task_type": "CAUSAL_LM",
25
+ "use_rslora": false
26
+ }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:660de157d33bf0576056f912000fbbaa549bb94f6d0e023fdc083bf8128b0a4d
3
+ size 3151856
special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": "</s>",
17
+ "unk_token": {
18
+ "content": "<unk>",
19
+ "lstrip": false,
20
+ "normalized": true,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ }
24
+ }
tokenizer.json ADDED
@@ -0,0 +1,922 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 128,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
+ "padding": {
10
+ "strategy": {
11
+ "Fixed": 128
12
+ },
13
+ "direction": "Left",
14
+ "pad_to_multiple_of": null,
15
+ "pad_id": 2,
16
+ "pad_type_id": 0,
17
+ "pad_token": "</s>"
18
+ },
19
+ "added_tokens": [
20
+ {
21
+ "id": 0,
22
+ "content": "<unk>",
23
+ "single_word": false,
24
+ "lstrip": false,
25
+ "rstrip": false,
26
+ "normalized": true,
27
+ "special": true
28
+ },
29
+ {
30
+ "id": 1,
31
+ "content": "<s>",
32
+ "single_word": false,
33
+ "lstrip": false,
34
+ "rstrip": false,
35
+ "normalized": true,
36
+ "special": true
37
+ },
38
+ {
39
+ "id": 2,
40
+ "content": "</s>",
41
+ "single_word": false,
42
+ "lstrip": false,
43
+ "rstrip": false,
44
+ "normalized": true,
45
+ "special": true
46
+ }
47
+ ],
48
+ "normalizer": {
49
+ "type": "Sequence",
50
+ "normalizers": [
51
+ {
52
+ "type": "Prepend",
53
+ "prepend": "▁"
54
+ },
55
+ {
56
+ "type": "Replace",
57
+ "pattern": {
58
+ "String": " "
59
+ },
60
+ "content": "▁"
61
+ }
62
+ ]
63
+ },
64
+ "pre_tokenizer": null,
65
+ "post_processor": {
66
+ "type": "TemplateProcessing",
67
+ "single": [
68
+ {
69
+ "SpecialToken": {
70
+ "id": "<s>",
71
+ "type_id": 0
72
+ }
73
+ },
74
+ {
75
+ "Sequence": {
76
+ "id": "A",
77
+ "type_id": 0
78
+ }
79
+ }
80
+ ],
81
+ "pair": [
82
+ {
83
+ "SpecialToken": {
84
+ "id": "<s>",
85
+ "type_id": 0
86
+ }
87
+ },
88
+ {
89
+ "Sequence": {
90
+ "id": "A",
91
+ "type_id": 0
92
+ }
93
+ },
94
+ {
95
+ "SpecialToken": {
96
+ "id": "<s>",
97
+ "type_id": 1
98
+ }
99
+ },
100
+ {
101
+ "Sequence": {
102
+ "id": "B",
103
+ "type_id": 1
104
+ }
105
+ }
106
+ ],
107
+ "special_tokens": {
108
+ "<s>": {
109
+ "id": "<s>",
110
+ "ids": [
111
+ 1
112
+ ],
113
+ "tokens": [
114
+ "<s>"
115
+ ]
116
+ }
117
+ }
118
+ },
119
+ "decoder": {
120
+ "type": "Sequence",
121
+ "decoders": [
122
+ {
123
+ "type": "Replace",
124
+ "pattern": {
125
+ "String": "▁"
126
+ },
127
+ "content": " "
128
+ },
129
+ {
130
+ "type": "ByteFallback"
131
+ },
132
+ {
133
+ "type": "Fuse"
134
+ },
135
+ {
136
+ "type": "Strip",
137
+ "content": " ",
138
+ "start": 1,
139
+ "stop": 0
140
+ }
141
+ ]
142
+ },
143
+ "model": {
144
+ "type": "Unigram",
145
+ "unk_id": 0,
146
+ "vocab": [
147
+ [
148
+ "<unk>",
149
+ 0.0
150
+ ],
151
+ [
152
+ "<s>",
153
+ 0.0
154
+ ],
155
+ [
156
+ "</s>",
157
+ 0.0
158
+ ],
159
+ [
160
+ "▁",
161
+ -0.5537281368002951
162
+ ],
163
+ [
164
+ "a",
165
+ -2.206163300308619
166
+ ],
167
+ [
168
+ "i",
169
+ -3.4698377124275996
170
+ ],
171
+ [
172
+ "o",
173
+ -3.625328505181651
174
+ ],
175
+ [
176
+ "d",
177
+ -3.710261874841528
178
+ ],
179
+ [
180
+ "y",
181
+ -3.895623014599913
182
+ ],
183
+ [
184
+ "n",
185
+ -3.9241564889678657
186
+ ],
187
+ [
188
+ "e",
189
+ -3.996031612968597
190
+ ],
191
+ [
192
+ "u",
193
+ -4.020550100040991
194
+ ],
195
+ [
196
+ "l",
197
+ -4.16796601703772
198
+ ],
199
+ [
200
+ "h",
201
+ -4.2061951544872755
202
+ ],
203
+ [
204
+ "s",
205
+ -4.258920876199081
206
+ ],
207
+ [
208
+ "k",
209
+ -4.270646474711075
210
+ ],
211
+ [
212
+ "r",
213
+ -4.366133846179466
214
+ ],
215
+ [
216
+ "m",
217
+ -4.661349427160829
218
+ ],
219
+ [
220
+ "g",
221
+ -4.671853885731711
222
+ ],
223
+ [
224
+ "b",
225
+ -4.764145142326377
226
+ ],
227
+ [
228
+ "w",
229
+ -5.020700862179128
230
+ ],
231
+ [
232
+ "t",
233
+ -5.039283250304928
234
+ ],
235
+ [
236
+ "x",
237
+ -5.041020067562583
238
+ ],
239
+ [
240
+ "q",
241
+ -5.565562390890502
242
+ ],
243
+ [
244
+ "c",
245
+ -5.627498296064616
246
+ ],
247
+ [
248
+ ",",
249
+ -5.821637688768487
250
+ ],
251
+ [
252
+ ".",
253
+ -6.056015545727806
254
+ ],
255
+ [
256
+ "S",
257
+ -6.224462278190527
258
+ ],
259
+ [
260
+ "f",
261
+ -6.228092265837139
262
+ ],
263
+ [
264
+ "M",
265
+ -6.305043609360995
266
+ ],
267
+ [
268
+ "j",
269
+ -6.4046242021046815
270
+ ],
271
+ [
272
+ "A",
273
+ -6.618608152829582
274
+ ],
275
+ [
276
+ "D",
277
+ -6.767235971284624
278
+ ],
279
+ [
280
+ "W",
281
+ -6.784002580071416
282
+ ],
283
+ [
284
+ "C",
285
+ -6.975347072856344
286
+ ],
287
+ [
288
+ "I",
289
+ -7.094522631592117
290
+ ],
291
+ [
292
+ "G",
293
+ -7.12377731380807
294
+ ],
295
+ [
296
+ "-",
297
+ -7.163134595285085
298
+ ],
299
+ [
300
+ "B",
301
+ -7.185302221532661
302
+ ],
303
+ [
304
+ "K",
305
+ -7.284107055272177
306
+ ],
307
+ [
308
+ "X",
309
+ -7.345178282504843
310
+ ],
311
+ [
312
+ "H",
313
+ -7.441136939513969
314
+ ],
315
+ [
316
+ "0",
317
+ -7.610454725175899
318
+ ],
319
+ [
320
+ "1",
321
+ -7.676846365553844
322
+ ],
323
+ [
324
+ "Q",
325
+ -7.6815023490292225
326
+ ],
327
+ [
328
+ "2",
329
+ -7.832934400654507
330
+ ],
331
+ [
332
+ "O",
333
+ -7.855510099432444
334
+ ],
335
+ [
336
+ "’",
337
+ -7.913303956478877
338
+ ],
339
+ [
340
+ "T",
341
+ -7.920521835325051
342
+ ],
343
+ [
344
+ "N",
345
+ -7.927129060971368
346
+ ],
347
+ [
348
+ "L",
349
+ -7.946540647005372
350
+ ],
351
+ [
352
+ "F",
353
+ -8.030392557146758
354
+ ],
355
+ [
356
+ "J",
357
+ -8.044456444862213
358
+ ],
359
+ [
360
+ "R",
361
+ -8.061750108119739
362
+ ],
363
+ [
364
+ "U",
365
+ -8.168080202728104
366
+ ],
367
+ [
368
+ "E",
369
+ -8.322863716456041
370
+ ],
371
+ [
372
+ ":",
373
+ -8.419997311703058
374
+ ],
375
+ [
376
+ ")",
377
+ -8.515578814777218
378
+ ],
379
+ [
380
+ "P",
381
+ -8.547115687654244
382
+ ],
383
+ [
384
+ "Y",
385
+ -8.550819395121305
386
+ ],
387
+ [
388
+ "(",
389
+ -8.564518237708931
390
+ ],
391
+ [
392
+ "\"",
393
+ -8.768258741460592
394
+ ],
395
+ [
396
+ "p",
397
+ -8.841598353802134
398
+ ],
399
+ [
400
+ "3",
401
+ -8.84491235773391
402
+ ],
403
+ [
404
+ "“",
405
+ -8.848237380812833
406
+ ],
407
+ [
408
+ "'",
409
+ -8.861649146182236
410
+ ],
411
+ [
412
+ "5",
413
+ -8.90475925914842
414
+ ],
415
+ [
416
+ "9",
417
+ -8.91005962353548
418
+ ],
419
+ [
420
+ "4",
421
+ -8.957212497597583
422
+ ],
423
+ [
424
+ "”",
425
+ -8.975957183394758
426
+ ],
427
+ [
428
+ "/",
429
+ -8.979748655995529
430
+ ],
431
+ [
432
+ "8",
433
+ -9.062882529049046
434
+ ],
435
+ [
436
+ "7",
437
+ -9.064948644751524
438
+ ],
439
+ [
440
+ "6",
441
+ -9.1513021242946
442
+ ],
443
+ [
444
+ "?",
445
+ -9.42740162082142
446
+ ],
447
+ [
448
+ "v",
449
+ -9.473002191090902
450
+ ],
451
+ [
452
+ "…",
453
+ -9.722540553349848
454
+ ],
455
+ [
456
+ "–",
457
+ -10.13702742185092
458
+ ],
459
+ [
460
+ "z",
461
+ -10.13702742185092
462
+ ],
463
+ [
464
+ "V",
465
+ -10.286656086276462
466
+ ],
467
+ [
468
+ ";",
469
+ -10.307933395522006
470
+ ],
471
+ [
472
+ "[",
473
+ -10.43788633130764
474
+ ],
475
+ [
476
+ "]",
477
+ -10.496726484580272
478
+ ],
479
+ [
480
+ "!",
481
+ -10.496726484580272
482
+ ],
483
+ [
484
+ "Z",
485
+ -10.797478062315149
486
+ ],
487
+ [
488
+ "_",
489
+ -10.821147530102262
490
+ ],
491
+ [
492
+ "&",
493
+ -10.895715264505524
494
+ ],
495
+ [
496
+ "‘",
497
+ -11.160012056497354
498
+ ],
499
+ [
500
+ "%",
501
+ -11.176961209039728
502
+ ],
503
+ [
504
+ "$",
505
+ -11.544672763846052
506
+ ],
507
+ [
508
+ "+",
509
+ -11.705005812336996
510
+ ],
511
+ [
512
+ "`",
513
+ -12.00725762502892
514
+ ],
515
+ [
516
+ "»",
517
+ -12.04725762502892
518
+ ],
519
+ [
520
+ "ل",
521
+ -12.088924291695587
522
+ ],
523
+ [
524
+ "ا",
525
+ -12.132402552565154
526
+ ],
527
+ [
528
+ "—",
529
+ -12.132402552565154
530
+ ],
531
+ [
532
+ "​",
533
+ -12.225476145638746
534
+ ],
535
+ [
536
+ "*",
537
+ -12.225476145638746
538
+ ],
539
+ [
540
+ "«",
541
+ -12.504986809553444
542
+ ],
543
+ [
544
+ "�",
545
+ -12.504986809553444
546
+ ],
547
+ [
548
+ "€",
549
+ -12.64308204764871
550
+ ],
551
+ [
552
+ "\\",
553
+ -12.803338457905266
554
+ ],
555
+ [
556
+ "ö",
557
+ -12.803338457905266
558
+ ],
559
+ [
560
+ "م",
561
+ -13.105358659928983
562
+ ],
563
+ [
564
+ "•",
565
+ -13.105358659928983
566
+ ],
567
+ [
568
+ "ä",
569
+ -13.230358659938087
570
+ ],
571
+ [
572
+ "ي",
573
+ -13.230358659938087
574
+ ],
575
+ [
576
+ "}",
577
+ -13.230358659938087
578
+ ],
579
+ [
580
+ "ه",
581
+ -13.373215802835192
582
+ ],
583
+ [
584
+ "ن",
585
+ -13.373215802835192
586
+ ],
587
+ [
588
+ "â",
589
+ -13.373215802835192
590
+ ],
591
+ [
592
+ "{",
593
+ -13.373215802835192
594
+ ],
595
+ [
596
+ "=",
597
+ -13.373215802835192
598
+ ],
599
+ [
600
+ "@",
601
+ -13.373215802835192
602
+ ],
603
+ [
604
+ "→",
605
+ -13.373215802835192
606
+ ],
607
+ [
608
+ "←",
609
+ -13.539882469501858
610
+ ],
611
+ [
612
+ "و",
613
+ -13.539882469501858
614
+ ],
615
+ [
616
+ "ع",
617
+ -13.73988246950186
618
+ ],
619
+ [
620
+ "£",
621
+ -13.73988246950186
622
+ ],
623
+ [
624
+ "·",
625
+ -13.73988246950186
626
+ ],
627
+ [
628
+ "س",
629
+ -13.73988246950186
630
+ ],
631
+ [
632
+ "^",
633
+ -13.73988246950186
634
+ ],
635
+ [
636
+ "ø",
637
+ -13.73988246950186
638
+ ],
639
+ [
640
+ "ر",
641
+ -13.73988246950186
642
+ ],
643
+ [
644
+ "´",
645
+ -13.73988246950186
646
+ ],
647
+ [
648
+ "ف",
649
+ -13.98988246950186
650
+ ],
651
+ [
652
+ "ص",
653
+ -13.98988246950186
654
+ ],
655
+ [
656
+ "é",
657
+ -13.98988246950186
658
+ ],
659
+ [
660
+ "œ",
661
+ -13.98988246950186
662
+ ],
663
+ [
664
+ "è",
665
+ -13.98988246950186
666
+ ],
667
+ [
668
+ "ح",
669
+ -14.323215802835191
670
+ ],
671
+ [
672
+ "á",
673
+ -14.323215802835191
674
+ ],
675
+ [
676
+ "í",
677
+ -14.323215802835191
678
+ ],
679
+ [
680
+ "„",
681
+ -14.323215802835191
682
+ ],
683
+ [
684
+ "Ø",
685
+ -14.323215802835191
686
+ ],
687
+ [
688
+ "ك",
689
+ -14.323215802835191
690
+ ],
691
+ [
692
+ "ü",
693
+ -14.823215802835191
694
+ ],
695
+ [
696
+ "<",
697
+ -14.823215802835191
698
+ ],
699
+ [
700
+ "أ",
701
+ -14.823215802835191
702
+ ],
703
+ [
704
+ "ُ",
705
+ -14.823215802835191
706
+ ],
707
+ [
708
+ "ى",
709
+ -14.823215802835191
710
+ ],
711
+ [
712
+ "፡",
713
+ -14.823215802835191
714
+ ],
715
+ [
716
+ "²",
717
+ -14.823215802835191
718
+ ],
719
+ [
720
+ "د",
721
+ -14.823215802835191
722
+ ],
723
+ [
724
+ "ء",
725
+ -14.823215802835191
726
+ ],
727
+ [
728
+ "ʼ",
729
+ -14.823215802835191
730
+ ],
731
+ [
732
+ "ب",
733
+ -14.823215802835191
734
+ ],
735
+ [
736
+ "­",
737
+ -14.823215802835191
738
+ ],
739
+ [
740
+ "",
741
+ -14.823215802835191
742
+ ],
743
+ [
744
+ "ط",
745
+ -15.823215802835191
746
+ ],
747
+ [
748
+ "职",
749
+ -15.823215802835191
750
+ ],
751
+ [
752
+ "å",
753
+ -15.823215802835191
754
+ ],
755
+ [
756
+ "ﷺ",
757
+ -15.823215802835191
758
+ ],
759
+ [
760
+ "业",
761
+ -15.823215802835191
762
+ ],
763
+ [
764
+ "”",
765
+ -15.823215802835191
766
+ ],
767
+ [
768
+ "ə",
769
+ -15.823215802835191
770
+ ],
771
+ [
772
+ "川",
773
+ -15.823215802835191
774
+ ],
775
+ [
776
+ "‎",
777
+ -15.823215802835191
778
+ ],
779
+ [
780
+ "ق",
781
+ -15.823215802835191
782
+ ],
783
+ [
784
+ "ē",
785
+ -15.823215802835191
786
+ ],
787
+ [
788
+ "‐",
789
+ -15.823215802835191
790
+ ],
791
+ [
792
+ "#",
793
+ -15.823215802835191
794
+ ],
795
+ [
796
+ "“",
797
+ -15.823215802835191
798
+ ],
799
+ [
800
+ "×",
801
+ -15.823215802835191
802
+ ],
803
+ [
804
+ "ï",
805
+ -15.823215802835191
806
+ ],
807
+ [
808
+ "ñ",
809
+ -15.823215802835191
810
+ ],
811
+ [
812
+ "─",
813
+ -15.823215802835191
814
+ ],
815
+ [
816
+ "®",
817
+ -15.823215802835191
818
+ ],
819
+ [
820
+ "ذ",
821
+ -15.823215802835191
822
+ ],
823
+ [
824
+ "ش",
825
+ -15.823215802835191
826
+ ],
827
+ [
828
+ "四",
829
+ -15.823215802835191
830
+ ],
831
+ [
832
+ "ج",
833
+ -15.823215802835191
834
+ ],
835
+ [
836
+ "↑",
837
+ -15.823215802835191
838
+ ],
839
+ [
840
+ "غ",
841
+ -15.823215802835191
842
+ ],
843
+ [
844
+ "传",
845
+ -15.823215802835191
846
+ ],
847
+ [
848
+ "媒",
849
+ -15.823215802835191
850
+ ],
851
+ [
852
+ "院",
853
+ -15.823215802835191
854
+ ],
855
+ [
856
+ "ë",
857
+ -15.823215802835191
858
+ ],
859
+ [
860
+ "学",
861
+ -15.823215802835191
862
+ ],
863
+ [
864
+ "ş",
865
+ -15.823215802835191
866
+ ],
867
+ [
868
+ "™",
869
+ -15.823215802835191
870
+ ],
871
+ [
872
+ "ğ",
873
+ -15.823215802835191
874
+ ],
875
+ [
876
+ "‏",
877
+ -15.823215802835191
878
+ ],
879
+ [
880
+ "ą",
881
+ -15.823215802835191
882
+ ],
883
+ [
884
+ "ç",
885
+ -15.823215802835191
886
+ ],
887
+ [
888
+ "ث",
889
+ -15.823215802835191
890
+ ],
891
+ [
892
+ "ت",
893
+ -15.823215802835191
894
+ ],
895
+ [
896
+ "ó",
897
+ -15.823215802835191
898
+ ],
899
+ [
900
+ "文",
901
+ -15.823215802835191
902
+ ],
903
+ [
904
+ "ã",
905
+ -15.823215802835191
906
+ ],
907
+ [
908
+ "化",
909
+ -15.823215802835191
910
+ ],
911
+ [
912
+ " ",
913
+ -15.823215802835191
914
+ ],
915
+ [
916
+ ">",
917
+ -15.823215802835191
918
+ ]
919
+ ],
920
+ "byte_fallback": false
921
+ }
922
+ }
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63639ba62c4af921cb7c373630bee7d45568fc5ff7a98add756e8aa57df59065
3
+ size 4754121
tokenizer_config.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": true,
3
+ "add_eos_token": false,
4
+ "added_tokens_decoder": {
5
+ "0": {
6
+ "content": "<unk>",
7
+ "lstrip": false,
8
+ "normalized": true,
9
+ "rstrip": false,
10
+ "single_word": false,
11
+ "special": true
12
+ },
13
+ "1": {
14
+ "content": "<s>",
15
+ "lstrip": false,
16
+ "normalized": true,
17
+ "rstrip": false,
18
+ "single_word": false,
19
+ "special": true
20
+ },
21
+ "2": {
22
+ "content": "</s>",
23
+ "lstrip": false,
24
+ "normalized": true,
25
+ "rstrip": false,
26
+ "single_word": false,
27
+ "special": true
28
+ }
29
+ },
30
+ "bos_token": "<s>",
31
+ "clean_up_tokenization_spaces": false,
32
+ "eos_token": "</s>",
33
+ "legacy": true,
34
+ "model_max_length": 2048,
35
+ "pad_token": "</s>",
36
+ "sp_model_kwargs": {},
37
+ "spaces_between_special_tokens": false,
38
+ "tokenizer_class": "LlamaTokenizer",
39
+ "unk_token": "<unk>",
40
+ "use_default_system_prompt": false
41
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82366e64111569909774e767935d25c38b0d6ebd06ea52858b8383b218e1f2be
3
+ size 4664