benitoals committed on
Commit
4c07f8f
·
verified ·
1 Parent(s): 06e8c85

Model save

Browse files
Files changed (32) hide show
  1. .gitattributes +1 -0
  2. README.md +223 -0
  3. adapter_config.json +32 -0
  4. adapter_model.safetensors +3 -0
  5. runs/Mar10_23-08-48_1412920010036/events.out.tfevents.1741662535.1412920010036.5471.0 +3 -0
  6. runs/Mar10_23-08-48_1412920010036/events.out.tfevents.1741667746.1412920010036.5471.1 +3 -0
  7. runs/Mar11_00-36-23_1412920010036/events.out.tfevents.1741667784.1412920010036.5471.2 +3 -0
  8. runs/Mar11_00-36-23_1412920010036/events.out.tfevents.1741668489.1412920010036.5471.3 +3 -0
  9. runs/Mar11_00-48-17_1412920010036/events.out.tfevents.1741668498.1412920010036.5471.4 +3 -0
  10. runs/Mar11_00-48-17_1412920010036/events.out.tfevents.1741673649.1412920010036.5471.5 +3 -0
  11. runs/Mar11_08-18-41_1412920010036/events.out.tfevents.1741695522.1412920010036.235349.0 +3 -0
  12. runs/Mar11_08-36-50_1412920010036/events.out.tfevents.1741696613.1412920010036.243166.0 +3 -0
  13. runs/Mar11_08-36-50_1412920010036/events.out.tfevents.1741706871.1412920010036.243166.1 +3 -0
  14. runs/Mar11_11-28-33_1412920010036/events.out.tfevents.1741706915.1412920010036.243166.2 +3 -0
  15. runs/Mar11_11-28-33_1412920010036/events.out.tfevents.1741708827.1412920010036.243166.3 +3 -0
  16. runs/Mar11_12-01-09_1412920010036/events.out.tfevents.1741708871.1412920010036.243166.4 +3 -0
  17. runs/Mar11_12-01-09_1412920010036/events.out.tfevents.1741719010.1412920010036.243166.5 +3 -0
  18. runs/Mar16_11-09-16_1412920010036/events.out.tfevents.1742137758.1412920010036.2788175.0 +3 -0
  19. runs/Mar16_11-09-16_1412920010036/events.out.tfevents.1742153024.1412920010036.2788175.1 +3 -0
  20. runs/Mar16_15-24-22_1412920010036/events.out.tfevents.1742153062.1412920010036.2788175.2 +3 -0
  21. runs/Mar16_15-24-22_1412920010036/events.out.tfevents.1742156125.1412920010036.2788175.3 +3 -0
  22. runs/Mar16_16-16-04_1412920010036/events.out.tfevents.1742156165.1412920010036.2788175.4 +3 -0
  23. runs/Mar16_16-16-04_1412920010036/events.out.tfevents.1742171274.1412920010036.2788175.5 +3 -0
  24. runs/Mar16_20-40-24_1412920010036/events.out.tfevents.1742172027.1412920010036.3060254.0 +3 -0
  25. runs/Mar17_07-22-30_1412920010036/events.out.tfevents.1742210552.1412920010036.3303252.0 +3 -0
  26. runs/Mar17_07-22-30_1412920010036/events.out.tfevents.1742223668.1412920010036.3303252.1 +3 -0
  27. runs/Mar17_11-02-11_1412920010036/events.out.tfevents.1742223732.1412920010036.3303252.2 +3 -0
  28. special_tokens_map.json +23 -0
  29. spiece.model +3 -0
  30. tokenizer.json +3 -0
  31. tokenizer_config.json +840 -0
  32. training_args.bin +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,223 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ license: apache-2.0
4
+ base_model: google/mt5-base
5
+ tags:
6
+ - generated_from_trainer
7
+ metrics:
8
+ - rouge
9
+ model-index:
10
+ - name: base-lora-hf
11
+ results: []
12
+ ---
13
+
14
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
15
+ should probably proofread and complete it, then remove this comment. -->
16
+
17
+ # base-lora-hf
18
+
19
+ This model is a fine-tuned version of [google/mt5-base](https://huggingface.co/google/mt5-base) on an unknown dataset.
20
+ It achieves the following results on the evaluation set:
21
+ - Loss: 4.9672
22
+ - Rouge1: 5.3819
23
+ - Rouge2: 0.5196
24
+ - Rougel: 4.7713
25
+ - Rougelsum: 4.7866
26
+
27
+ ## Model description
28
+
29
+ More information needed
30
+
31
+ ## Intended uses & limitations
32
+
33
+ More information needed
34
+
35
+ ## Training and evaluation data
36
+
37
+ More information needed
38
+
39
+ ## Training procedure
40
+
41
+ ### Training hyperparameters
42
+
43
+ The following hyperparameters were used during training:
44
+ - learning_rate: 0.0001
45
+ - train_batch_size: 4
46
+ - eval_batch_size: 4
47
+ - seed: 42
48
+ - optimizer: AdamW (OptimizerNames.ADAMW_TORCH) with betas=(0.9,0.999) and epsilon=1e-08; no additional optimizer arguments
49
+ - lr_scheduler_type: linear
50
+ - num_epochs: 4
51
+
52
+ ### Training results
53
+
54
+ | Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum |
55
+ |:-------------:|:------:|:----:|:---------------:|:------:|:------:|:------:|:---------:|
56
+ | 19.9845 | 0.0251 | 5 | 20.2996 | 0.9748 | 0.2022 | 0.9325 | 0.9418 |
57
+ | 21.4138 | 0.0503 | 10 | 20.5804 | 0.9695 | 0.2108 | 0.9242 | 0.9322 |
58
+ | 22.1251 | 0.0754 | 15 | 20.5377 | 0.9484 | 0.2108 | 0.9059 | 0.9121 |
59
+ | 21.3367 | 0.1005 | 20 | 20.3529 | 0.9310 | 0.1873 | 0.8883 | 0.8910 |
60
+ | 21.8064 | 0.1256 | 25 | 20.1915 | 0.9299 | 0.1873 | 0.8920 | 0.8878 |
61
+ | 22.1628 | 0.1508 | 30 | 19.8701 | 0.9189 | 0.1867 | 0.8760 | 0.8783 |
62
+ | 19.1129 | 0.1759 | 35 | 19.4976 | 0.9189 | 0.1867 | 0.8760 | 0.8783 |
63
+ | 22.7727 | 0.2010 | 40 | 19.3954 | 0.8863 | 0.1693 | 0.8449 | 0.8450 |
64
+ | 19.4877 | 0.2261 | 45 | 19.3051 | 0.8695 | 0.1693 | 0.8311 | 0.8350 |
65
+ | 22.7237 | 0.2513 | 50 | 19.0373 | 0.9211 | 0.1867 | 0.8840 | 0.8873 |
66
+ | 20.0259 | 0.2764 | 55 | 18.8301 | 0.9075 | 0.1867 | 0.8753 | 0.8772 |
67
+ | 20.0452 | 0.3015 | 60 | 18.6446 | 0.9345 | 0.1867 | 0.8992 | 0.9021 |
68
+ | 19.9441 | 0.3266 | 65 | 18.5094 | 0.9493 | 0.1867 | 0.9210 | 0.9190 |
69
+ | 20.6445 | 0.3518 | 70 | 17.7888 | 0.9241 | 0.1867 | 0.8851 | 0.8835 |
70
+ | 20.2272 | 0.3769 | 75 | 17.7626 | 0.8845 | 0.1867 | 0.8603 | 0.8597 |
71
+ | 19.4512 | 0.4020 | 80 | 17.4225 | 0.8690 | 0.1693 | 0.8451 | 0.8463 |
72
+ | 18.6298 | 0.4271 | 85 | 17.2512 | 0.8690 | 0.1693 | 0.8451 | 0.8463 |
73
+ | 19.8135 | 0.4523 | 90 | 16.9832 | 0.8717 | 0.1693 | 0.8470 | 0.8476 |
74
+ | 18.1969 | 0.4774 | 95 | 16.5094 | 0.8603 | 0.1693 | 0.8375 | 0.8378 |
75
+ | 18.2965 | 0.5025 | 100 | 16.2330 | 0.8725 | 0.1693 | 0.8469 | 0.8480 |
76
+ | 17.7528 | 0.5276 | 105 | 15.9999 | 0.9351 | 0.2016 | 0.8999 | 0.9103 |
77
+ | 18.5468 | 0.5528 | 110 | 15.8200 | 0.9093 | 0.2005 | 0.8722 | 0.8864 |
78
+ | 18.5202 | 0.5779 | 115 | 15.2716 | 0.9639 | 0.2307 | 0.9213 | 0.9236 |
79
+ | 18.4827 | 0.6030 | 120 | 15.0205 | 1.0231 | 0.2307 | 0.9861 | 0.9923 |
80
+ | 18.4432 | 0.6281 | 125 | 14.2666 | 1.0696 | 0.2412 | 1.0329 | 1.0385 |
81
+ | 15.5714 | 0.6533 | 130 | 13.8502 | 1.0922 | 0.2793 | 1.0538 | 1.0591 |
82
+ | 16.6447 | 0.6784 | 135 | 13.3299 | 1.1199 | 0.2929 | 1.0721 | 1.0778 |
83
+ | 16.5493 | 0.7035 | 140 | 13.1941 | 1.2006 | 0.2819 | 1.1359 | 1.1420 |
84
+ | 16.5007 | 0.7286 | 145 | 13.0195 | 1.1336 | 0.2819 | 1.0792 | 1.0843 |
85
+ | 15.3121 | 0.7538 | 150 | 12.5816 | 1.0646 | 0.2355 | 1.0290 | 1.0348 |
86
+ | 15.9766 | 0.7789 | 155 | 12.2410 | 1.1067 | 0.2355 | 1.0669 | 1.0773 |
87
+ | 14.5082 | 0.8040 | 160 | 11.9994 | 1.1207 | 0.2355 | 1.0817 | 1.0943 |
88
+ | 14.812 | 0.8291 | 165 | 11.5947 | 1.0905 | 0.2344 | 1.0519 | 1.0659 |
89
+ | 15.0269 | 0.8543 | 170 | 11.3428 | 1.0979 | 0.2357 | 1.0521 | 1.0671 |
90
+ | 14.4106 | 0.8794 | 175 | 11.1049 | 1.1636 | 0.2357 | 1.1055 | 1.1181 |
91
+ | 14.1319 | 0.9045 | 180 | 10.7609 | 1.2215 | 0.2248 | 1.1438 | 1.1535 |
92
+ | 13.8952 | 0.9296 | 185 | 10.5520 | 1.2630 | 0.2248 | 1.1831 | 1.1883 |
93
+ | 12.7063 | 0.9548 | 190 | 10.4312 | 1.3229 | 0.2378 | 1.2448 | 1.2592 |
94
+ | 13.4554 | 0.9799 | 195 | 10.2339 | 1.3215 | 0.2384 | 1.2514 | 1.2582 |
95
+ | 14.6064 | 1.0050 | 200 | 9.9984 | 1.3350 | 0.2384 | 1.2627 | 1.2693 |
96
+ | 12.8018 | 1.0302 | 205 | 9.7809 | 1.3170 | 0.2350 | 1.2483 | 1.2603 |
97
+ | 12.6067 | 1.0553 | 210 | 9.5817 | 1.4603 | 0.2350 | 1.3532 | 1.3609 |
98
+ | 12.7822 | 1.0804 | 215 | 9.4338 | 1.5522 | 0.2447 | 1.4238 | 1.4276 |
99
+ | 12.596 | 1.1055 | 220 | 9.3207 | 1.5781 | 0.2436 | 1.4383 | 1.4388 |
100
+ | 11.9216 | 1.1307 | 225 | 9.1564 | 1.6240 | 0.2417 | 1.4953 | 1.4960 |
101
+ | 12.0841 | 1.1558 | 230 | 9.0333 | 1.7191 | 0.2437 | 1.5857 | 1.5886 |
102
+ | 11.5676 | 1.1809 | 235 | 8.9293 | 1.6431 | 0.2437 | 1.5272 | 1.5248 |
103
+ | 11.4117 | 1.2060 | 240 | 8.7542 | 1.6855 | 0.2447 | 1.5391 | 1.5390 |
104
+ | 11.1348 | 1.2312 | 245 | 8.5618 | 1.8631 | 0.2640 | 1.7019 | 1.7125 |
105
+ | 11.2796 | 1.2563 | 250 | 8.3880 | 1.8559 | 0.2379 | 1.7178 | 1.7262 |
106
+ | 10.7728 | 1.2814 | 255 | 8.2453 | 2.0466 | 0.2500 | 1.8301 | 1.8343 |
107
+ | 10.7193 | 1.3065 | 260 | 8.0746 | 2.0877 | 0.2297 | 1.8682 | 1.8809 |
108
+ | 10.3078 | 1.3317 | 265 | 7.9463 | 2.1213 | 0.2118 | 1.8659 | 1.8702 |
109
+ | 9.4906 | 1.3568 | 270 | 7.8111 | 2.2115 | 0.1872 | 1.9316 | 1.9337 |
110
+ | 9.7248 | 1.3819 | 275 | 7.7112 | 2.3184 | 0.1621 | 2.0219 | 2.0422 |
111
+ | 9.12 | 1.4070 | 280 | 7.6426 | 2.3553 | 0.1770 | 2.0438 | 2.0638 |
112
+ | 9.9925 | 1.4322 | 285 | 7.5105 | 2.2216 | 0.1630 | 1.9617 | 1.9819 |
113
+ | 9.2764 | 1.4573 | 290 | 7.4422 | 2.2106 | 0.1344 | 2.0391 | 2.0359 |
114
+ | 9.0597 | 1.4824 | 295 | 7.3792 | 2.1439 | 0.1053 | 2.0053 | 1.9983 |
115
+ | 8.5065 | 1.5075 | 300 | 7.3106 | 2.0833 | 0.1089 | 1.8708 | 1.8755 |
116
+ | 8.992 | 1.5327 | 305 | 7.2412 | 2.0063 | 0.1084 | 1.8417 | 1.8540 |
117
+ | 8.6069 | 1.5578 | 310 | 7.1944 | 1.9500 | 0.1077 | 1.7940 | 1.8023 |
118
+ | 9.0201 | 1.5829 | 315 | 7.1420 | 2.0260 | 0.0967 | 1.8499 | 1.8535 |
119
+ | 8.8578 | 1.6080 | 320 | 7.0990 | 2.1266 | 0.0860 | 1.9794 | 1.9809 |
120
+ | 8.8284 | 1.6332 | 325 | 7.0596 | 2.0635 | 0.0982 | 1.9106 | 1.9164 |
121
+ | 8.3734 | 1.6583 | 330 | 7.0340 | 1.9703 | 0.0852 | 1.8102 | 1.8107 |
122
+ | 8.6248 | 1.6834 | 335 | 6.9965 | 1.8375 | 0.0843 | 1.7519 | 1.7559 |
123
+ | 8.3218 | 1.7085 | 340 | 6.9770 | 1.8187 | 0.0720 | 1.7496 | 1.7501 |
124
+ | 8.3853 | 1.7337 | 345 | 6.9528 | 1.7610 | 0.0598 | 1.6486 | 1.6470 |
125
+ | 8.4904 | 1.7588 | 350 | 6.9318 | 1.6401 | 0.0486 | 1.5289 | 1.5242 |
126
+ | 8.2582 | 1.7839 | 355 | 6.9122 | 1.6295 | 0.0493 | 1.5232 | 1.5156 |
127
+ | 8.5878 | 1.8090 | 360 | 6.8823 | 1.6154 | 0.0258 | 1.5108 | 1.5050 |
128
+ | 7.7663 | 1.8342 | 365 | 6.8499 | 1.5827 | 0.0258 | 1.5094 | 1.5009 |
129
+ | 8.2 | 1.8593 | 370 | 6.8237 | 1.6436 | 0.0258 | 1.5411 | 1.5388 |
130
+ | 7.5589 | 1.8844 | 375 | 6.8067 | 1.6364 | 0.0258 | 1.5458 | 1.5432 |
131
+ | 8.1803 | 1.9095 | 380 | 6.7845 | 1.5375 | 0.0124 | 1.4493 | 1.4461 |
132
+ | 7.7374 | 1.9347 | 385 | 6.7645 | 1.5121 | 0.0124 | 1.4347 | 1.4303 |
133
+ | 7.8814 | 1.9598 | 390 | 6.7452 | 1.5152 | 0.0124 | 1.4376 | 1.4363 |
134
+ | 7.6648 | 1.9849 | 395 | 6.7257 | 1.5162 | 0.0124 | 1.4428 | 1.4339 |
135
+ | 7.6132 | 2.0101 | 400 | 6.7029 | 1.5577 | 0.0124 | 1.4781 | 1.4777 |
136
+ | 7.864 | 2.0352 | 405 | 6.6846 | 1.6281 | 0.0124 | 1.5464 | 1.5479 |
137
+ | 7.5629 | 2.0603 | 410 | 6.6705 | 1.6544 | 0.0124 | 1.5745 | 1.5703 |
138
+ | 7.6238 | 2.0854 | 415 | 6.6598 | 1.6077 | 0.0124 | 1.5295 | 1.5295 |
139
+ | 7.4898 | 2.1106 | 420 | 6.6395 | 1.6862 | 0.0124 | 1.6088 | 1.6062 |
140
+ | 7.8069 | 2.1357 | 425 | 6.6117 | 1.7010 | 0.0124 | 1.6381 | 1.6358 |
141
+ | 7.4597 | 2.1608 | 430 | 6.5884 | 1.7218 | 0.0124 | 1.6599 | 1.6582 |
142
+ | 7.3898 | 2.1859 | 435 | 6.5677 | 1.7601 | 0.0124 | 1.7094 | 1.7086 |
143
+ | 7.3911 | 2.2111 | 440 | 6.5463 | 1.8674 | 0.0124 | 1.8057 | 1.7979 |
144
+ | 7.1733 | 2.2362 | 445 | 6.5197 | 1.8953 | 0.0124 | 1.8350 | 1.8341 |
145
+ | 7.1887 | 2.2613 | 450 | 6.4986 | 1.9404 | 0.0124 | 1.8864 | 1.8842 |
146
+ | 7.0774 | 2.2864 | 455 | 6.4825 | 2.0663 | 0.0124 | 2.0050 | 2.0030 |
147
+ | 7.2954 | 2.3116 | 460 | 6.4684 | 2.1557 | 0.0124 | 2.0807 | 2.0742 |
148
+ | 7.0925 | 2.3367 | 465 | 6.4529 | 2.2422 | 0.0124 | 2.1712 | 2.1695 |
149
+ | 7.1943 | 2.3618 | 470 | 6.4348 | 2.3632 | 0.0124 | 2.2752 | 2.2679 |
150
+ | 7.0861 | 2.3869 | 475 | 6.4134 | 2.4368 | 0.0124 | 2.3484 | 2.3430 |
151
+ | 7.18 | 2.4121 | 480 | 6.3854 | 2.5631 | 0.0124 | 2.4796 | 2.4720 |
152
+ | 7.2415 | 2.4372 | 485 | 6.3554 | 2.6147 | 0.0124 | 2.5171 | 2.5113 |
153
+ | 7.0627 | 2.4623 | 490 | 6.3225 | 2.7857 | 0.0124 | 2.6762 | 2.6708 |
154
+ | 7.2473 | 2.4874 | 495 | 6.2878 | 2.8660 | 0.0 | 2.7604 | 2.7589 |
155
+ | 7.1432 | 2.5126 | 500 | 6.2584 | 3.0089 | 0.0 | 2.8942 | 2.9031 |
156
+ | 6.8786 | 2.5377 | 505 | 6.2204 | 3.0677 | 0.0 | 2.9803 | 2.9827 |
157
+ | 7.2605 | 2.5628 | 510 | 6.1884 | 3.1637 | 0.0 | 3.0661 | 3.0713 |
158
+ | 6.8372 | 2.5879 | 515 | 6.1583 | 3.2234 | 0.0 | 3.1330 | 3.1292 |
159
+ | 6.9582 | 2.6131 | 520 | 6.1281 | 3.4104 | 0.0 | 3.2578 | 3.2674 |
160
+ | 6.834 | 2.6382 | 525 | 6.0949 | 3.5180 | 0.0137 | 3.3648 | 3.3729 |
161
+ | 7.065 | 2.6633 | 530 | 6.0598 | 3.5609 | 0.0137 | 3.4115 | 3.4148 |
162
+ | 6.8041 | 2.6884 | 535 | 6.0301 | 3.6212 | 0.0263 | 3.4610 | 3.4601 |
163
+ | 7.0177 | 2.7136 | 540 | 6.0045 | 3.6462 | 0.0263 | 3.4834 | 3.4829 |
164
+ | 6.7565 | 2.7387 | 545 | 5.9789 | 3.6683 | 0.0263 | 3.5033 | 3.5079 |
165
+ | 6.6908 | 2.7638 | 550 | 5.9469 | 3.6961 | 0.0263 | 3.5384 | 3.5331 |
166
+ | 6.6701 | 2.7889 | 555 | 5.9122 | 3.8271 | 0.0398 | 3.6780 | 3.6719 |
167
+ | 6.703 | 2.8141 | 560 | 5.8798 | 3.9789 | 0.0399 | 3.8203 | 3.8054 |
168
+ | 6.7734 | 2.8392 | 565 | 5.8518 | 4.0644 | 0.0533 | 3.9002 | 3.9022 |
169
+ | 6.8523 | 2.8643 | 570 | 5.8196 | 4.0991 | 0.0653 | 3.9677 | 3.9648 |
170
+ | 6.477 | 2.8894 | 575 | 5.7907 | 4.1666 | 0.0914 | 4.0340 | 4.0302 |
171
+ | 6.8284 | 2.9146 | 580 | 5.7659 | 4.1567 | 0.0914 | 4.0088 | 4.0067 |
172
+ | 6.8174 | 2.9397 | 585 | 5.7360 | 4.2228 | 0.0914 | 4.0340 | 4.0372 |
173
+ | 6.7112 | 2.9648 | 590 | 5.7117 | 4.2814 | 0.0915 | 4.0661 | 4.0639 |
174
+ | 6.5568 | 2.9899 | 595 | 5.6804 | 4.3052 | 0.1413 | 4.0651 | 4.0724 |
175
+ | 6.4933 | 3.0151 | 600 | 5.6472 | 4.3145 | 0.1273 | 4.0867 | 4.0873 |
176
+ | 6.3 | 3.0402 | 605 | 5.5958 | 4.2657 | 0.1510 | 4.0182 | 4.0272 |
177
+ | 6.5645 | 3.0653 | 610 | 5.5545 | 4.2810 | 0.1695 | 4.0035 | 3.9989 |
178
+ | 6.5585 | 3.0905 | 615 | 5.5188 | 4.3714 | 0.1699 | 4.1262 | 4.1184 |
179
+ | 6.5803 | 3.1156 | 620 | 5.4954 | 4.3159 | 0.1574 | 4.0346 | 4.0352 |
180
+ | 6.3667 | 3.1407 | 625 | 5.4669 | 4.4380 | 0.1829 | 4.1416 | 4.1304 |
181
+ | 6.4128 | 3.1658 | 630 | 5.4418 | 4.4830 | 0.1828 | 4.1453 | 4.1436 |
182
+ | 6.2 | 3.1910 | 635 | 5.4183 | 4.5121 | 0.1953 | 4.1746 | 4.1750 |
183
+ | 6.2363 | 3.2161 | 640 | 5.3853 | 4.6840 | 0.2092 | 4.3241 | 4.3157 |
184
+ | 6.3394 | 3.2412 | 645 | 5.3572 | 4.6549 | 0.1969 | 4.3112 | 4.3093 |
185
+ | 6.3711 | 3.2663 | 650 | 5.3348 | 4.8189 | 0.2395 | 4.4461 | 4.4309 |
186
+ | 6.3356 | 3.2915 | 655 | 5.3154 | 4.7549 | 0.2282 | 4.3740 | 4.3551 |
187
+ | 6.2359 | 3.3166 | 660 | 5.2990 | 4.7922 | 0.2556 | 4.3994 | 4.3842 |
188
+ | 6.1759 | 3.3417 | 665 | 5.2830 | 4.9007 | 0.2765 | 4.4718 | 4.4659 |
189
+ | 6.5212 | 3.3668 | 670 | 5.2652 | 4.8672 | 0.2772 | 4.4498 | 4.4419 |
190
+ | 6.3572 | 3.3920 | 675 | 5.2523 | 4.8740 | 0.2921 | 4.4736 | 4.4664 |
191
+ | 6.142 | 3.4171 | 680 | 5.2297 | 4.8456 | 0.3048 | 4.4642 | 4.4639 |
192
+ | 6.2698 | 3.4422 | 685 | 5.2075 | 4.9942 | 0.3382 | 4.5893 | 4.5796 |
193
+ | 6.1898 | 3.4673 | 690 | 5.1786 | 5.0596 | 0.3377 | 4.6012 | 4.6013 |
194
+ | 6.1935 | 3.4925 | 695 | 5.1579 | 5.1421 | 0.3352 | 4.6368 | 4.6311 |
195
+ | 6.0207 | 3.5176 | 700 | 5.1373 | 5.1597 | 0.3198 | 4.6450 | 4.6314 |
196
+ | 6.2054 | 3.5427 | 705 | 5.1142 | 5.3065 | 0.3589 | 4.7477 | 4.7568 |
197
+ | 6.0647 | 3.5678 | 710 | 5.0953 | 5.3270 | 0.4192 | 4.7751 | 4.7847 |
198
+ | 6.2467 | 3.5930 | 715 | 5.0779 | 5.3485 | 0.4558 | 4.7980 | 4.8109 |
199
+ | 6.2021 | 3.6181 | 720 | 5.0642 | 5.3178 | 0.4558 | 4.7720 | 4.7920 |
200
+ | 6.1525 | 3.6432 | 725 | 5.0512 | 5.2626 | 0.4670 | 4.7375 | 4.7532 |
201
+ | 5.9856 | 3.6683 | 730 | 5.0375 | 5.3317 | 0.4597 | 4.7651 | 4.7658 |
202
+ | 6.3415 | 3.6935 | 735 | 5.0281 | 5.2917 | 0.4597 | 4.7487 | 4.7482 |
203
+ | 5.9981 | 3.7186 | 740 | 5.0204 | 5.2751 | 0.4597 | 4.7114 | 4.7088 |
204
+ | 6.1648 | 3.7437 | 745 | 5.0091 | 5.2866 | 0.4597 | 4.7184 | 4.7199 |
205
+ | 6.1724 | 3.7688 | 750 | 5.0011 | 5.3533 | 0.4597 | 4.7817 | 4.7842 |
206
+ | 6.0231 | 3.7940 | 755 | 4.9939 | 5.3533 | 0.4597 | 4.7817 | 4.7842 |
207
+ | 5.9608 | 3.8191 | 760 | 4.9870 | 5.4313 | 0.4952 | 4.8477 | 4.8522 |
208
+ | 6.1358 | 3.8442 | 765 | 4.9817 | 5.4523 | 0.5043 | 4.8543 | 4.8664 |
209
+ | 6.061 | 3.8693 | 770 | 4.9765 | 5.5196 | 0.5196 | 4.8860 | 4.8956 |
210
+ | 6.2685 | 3.8945 | 775 | 4.9726 | 5.4864 | 0.5196 | 4.8490 | 4.8594 |
211
+ | 6.0714 | 3.9196 | 780 | 4.9702 | 5.4314 | 0.5196 | 4.8078 | 4.8230 |
212
+ | 6.1423 | 3.9447 | 785 | 4.9686 | 5.3819 | 0.5196 | 4.7713 | 4.7866 |
213
+ | 5.931 | 3.9698 | 790 | 4.9676 | 5.4160 | 0.5196 | 4.8078 | 4.8230 |
214
+ | 6.148 | 3.9950 | 795 | 4.9672 | 5.3819 | 0.5196 | 4.7713 | 4.7866 |
215
+
216
+
217
+ ### Framework versions
218
+
219
+ - PEFT 0.14.0
220
+ - Transformers 4.49.0
221
+ - Pytorch 2.6.0+cu124
222
+ - Datasets 3.3.2
223
+ - Tokenizers 0.21.0
adapter_config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": null,
4
+ "base_model_name_or_path": "google/mt5-base",
5
+ "bias": "none",
6
+ "eva_config": null,
7
+ "exclude_modules": null,
8
+ "fan_in_fan_out": false,
9
+ "inference_mode": true,
10
+ "init_lora_weights": true,
11
+ "layer_replication": null,
12
+ "layers_pattern": null,
13
+ "layers_to_transform": null,
14
+ "loftq_config": {},
15
+ "lora_alpha": 16,
16
+ "lora_bias": false,
17
+ "lora_dropout": 0.2,
18
+ "megatron_config": null,
19
+ "megatron_core": "megatron.core",
20
+ "modules_to_save": null,
21
+ "peft_type": "LORA",
22
+ "r": 1,
23
+ "rank_pattern": {},
24
+ "revision": null,
25
+ "target_modules": [
26
+ "q",
27
+ "v"
28
+ ],
29
+ "task_type": "SEQ_2_SEQ_LM",
30
+ "use_dora": false,
31
+ "use_rslora": false
32
+ }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9cf6f7f3e88221425f733f47059a8577b1dacca61397d9d11f9b698015cbcd2
3
+ size 462040
runs/Mar10_23-08-48_1412920010036/events.out.tfevents.1741662535.1412920010036.5471.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d86bf84720e7f90ac974efa75515570b134c9d405e77c7b946753da0a78708c9
3
+ size 91015
runs/Mar10_23-08-48_1412920010036/events.out.tfevents.1741667746.1412920010036.5471.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:792a75e640434bf8aa50b1ef06323080a1c16079af61c3bf8694eb452fad42a6
3
+ size 562
runs/Mar11_00-36-23_1412920010036/events.out.tfevents.1741667784.1412920010036.5471.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14a0ec7de23abb4f0a5d2089d151629190d92f5ec867f3f325c6be120106b2fe
3
+ size 59508
runs/Mar11_00-36-23_1412920010036/events.out.tfevents.1741668489.1412920010036.5471.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf2e319d10421337f47f1e8b3f46bae0ad327b388a3e7f90b0e1965ffdbc5d5a
3
+ size 562
runs/Mar11_00-48-17_1412920010036/events.out.tfevents.1741668498.1412920010036.5471.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d85e822375a87e28f05d12ef333b2fb6fd159fe4f9a19f1f70ba612647cfb70a
3
+ size 91030
runs/Mar11_00-48-17_1412920010036/events.out.tfevents.1741673649.1412920010036.5471.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00f80e0e8a6988580e823614cd7f35439cdb0938a3ace2d1fd4358ba8f788052
3
+ size 562
runs/Mar11_08-18-41_1412920010036/events.out.tfevents.1741695522.1412920010036.235349.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a351088403358a6e3ed6d487f24a9e6b63a3c00043cebc546bf195ce0ad75e0
3
+ size 8924
runs/Mar11_08-36-50_1412920010036/events.out.tfevents.1741696613.1412920010036.243166.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8b85c7d0e23e119678b0ca6026c0a32bbd115ca0c00d66d7557d08945fcbb2a
3
+ size 176636
runs/Mar11_08-36-50_1412920010036/events.out.tfevents.1741706871.1412920010036.243166.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10f1c7671cba5b2b3a49d643cc0171f5caa39468117d1aabefa9df00cb178ea3
3
+ size 562
runs/Mar11_11-28-33_1412920010036/events.out.tfevents.1741706915.1412920010036.243166.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0d6042ab546ed0306f50935e16c50c7da9d5ab234567950aa455979e0d1d44b
3
+ size 114304
runs/Mar11_11-28-33_1412920010036/events.out.tfevents.1741708827.1412920010036.243166.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a68052302a939cdcae8f660c29206fda498cf5bd6156f7c0759b5a0511db490
3
+ size 562
runs/Mar11_12-01-09_1412920010036/events.out.tfevents.1741708871.1412920010036.243166.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afbc32f901a15cf55d6682328172fa8bb18c97a8dab6fe53e34a905894f45b81
3
+ size 176651
runs/Mar11_12-01-09_1412920010036/events.out.tfevents.1741719010.1412920010036.243166.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dde0983bb360cd2d8485acc60044ed44bc470fd1bcd2aeb72bf83071abb8830d
3
+ size 562
runs/Mar16_11-09-16_1412920010036/events.out.tfevents.1742137758.1412920010036.2788175.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5c50c6e0e23cd477a941b5d36a0d321e120e2bb69ba10fcca7f99734a6d4e91
3
+ size 262262
runs/Mar16_11-09-16_1412920010036/events.out.tfevents.1742153024.1412920010036.2788175.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d7672a87a44b3c3be97bcccc40603e3e4e82b5c3627cb1f398433cae9ac13fe
3
+ size 562
runs/Mar16_15-24-22_1412920010036/events.out.tfevents.1742153062.1412920010036.2788175.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fef2de389fb253754c18816e070fb8af75dac7f30933574f3dc7c96f864fc526
3
+ size 168420
runs/Mar16_15-24-22_1412920010036/events.out.tfevents.1742156125.1412920010036.2788175.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4586f738fa7df3f2666120efc09f54f65166e7621e08fc10ffef59ec9a2020d2
3
+ size 562
runs/Mar16_16-16-04_1412920010036/events.out.tfevents.1742156165.1412920010036.2788175.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ceb08d948a1eb1c826c753f0c293111bedf46d85ed84b6634e2fb85431ed228b
3
+ size 262277
runs/Mar16_16-16-04_1412920010036/events.out.tfevents.1742171274.1412920010036.2788175.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80794494318f8e72dd2c18d665fb1bc8b461fd279b108675b08f1f73b263d639
3
+ size 562
runs/Mar16_20-40-24_1412920010036/events.out.tfevents.1742172027.1412920010036.3060254.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4035bc34d5cf7ec7662fab1d6416ed9a240003daf2f09f375e04024aa8ebe86d
3
+ size 17477
runs/Mar17_07-22-30_1412920010036/events.out.tfevents.1742210552.1412920010036.3303252.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:631b00899e9781ae2a115de6c819b5863214fcf343c98aab124f3bd3c90a0126
3
+ size 139673
runs/Mar17_07-22-30_1412920010036/events.out.tfevents.1742223668.1412920010036.3303252.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:032299957c07243cf0cc63af798d55dfcd56cbef728c7e973ea43420a05ff1dc
3
+ size 562
runs/Mar17_11-02-11_1412920010036/events.out.tfevents.1742223732.1412920010036.3303252.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94437c1acaee1ae9ba1024863b24f5d32384f936043c581c4300eabc6ce92371
3
+ size 114331
special_tokens_map.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eos_token": {
3
+ "content": "</s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "pad_token": {
10
+ "content": "<pad>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "unk_token": {
17
+ "content": "<unk>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ }
23
+ }
spiece.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef78f86560d809067d12bac6c09f19a462cb3af3f54d2b8acbba26e1433125d6
3
+ size 4309802
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90ed658667887a6a72b5f071e2e34bd3d9c562683f9c71a2f9c7c1c414e6c5bc
3
+ size 16350026
tokenizer_config.json ADDED
@@ -0,0 +1,840 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": null,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "<pad>",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "1": {
13
+ "content": "</s>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "2": {
21
+ "content": "<unk>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "250000": {
29
+ "content": "▁<extra_id_99>",
30
+ "lstrip": false,
31
+ "normalized": false,
32
+ "rstrip": false,
33
+ "single_word": false,
34
+ "special": false
35
+ },
36
+ "250001": {
37
+ "content": "▁<extra_id_98>",
38
+ "lstrip": false,
39
+ "normalized": false,
40
+ "rstrip": false,
41
+ "single_word": false,
42
+ "special": false
43
+ },
44
+ "250002": {
45
+ "content": "▁<extra_id_97>",
46
+ "lstrip": false,
47
+ "normalized": false,
48
+ "rstrip": false,
49
+ "single_word": false,
50
+ "special": false
51
+ },
52
+ "250003": {
53
+ "content": "▁<extra_id_96>",
54
+ "lstrip": false,
55
+ "normalized": false,
56
+ "rstrip": false,
57
+ "single_word": false,
58
+ "special": false
59
+ },
60
+ "250004": {
61
+ "content": "▁<extra_id_95>",
62
+ "lstrip": false,
63
+ "normalized": false,
64
+ "rstrip": false,
65
+ "single_word": false,
66
+ "special": false
67
+ },
68
+ "250005": {
69
+ "content": "▁<extra_id_94>",
70
+ "lstrip": false,
71
+ "normalized": false,
72
+ "rstrip": false,
73
+ "single_word": false,
74
+ "special": false
75
+ },
76
+ "250006": {
77
+ "content": "▁<extra_id_93>",
78
+ "lstrip": false,
79
+ "normalized": false,
80
+ "rstrip": false,
81
+ "single_word": false,
82
+ "special": false
83
+ },
84
+ "250007": {
85
+ "content": "▁<extra_id_92>",
86
+ "lstrip": false,
87
+ "normalized": false,
88
+ "rstrip": false,
89
+ "single_word": false,
90
+ "special": false
91
+ },
92
+ "250008": {
93
+ "content": "▁<extra_id_91>",
94
+ "lstrip": false,
95
+ "normalized": false,
96
+ "rstrip": false,
97
+ "single_word": false,
98
+ "special": false
99
+ },
100
+ "250009": {
101
+ "content": "▁<extra_id_90>",
102
+ "lstrip": false,
103
+ "normalized": false,
104
+ "rstrip": false,
105
+ "single_word": false,
106
+ "special": false
107
+ },
108
+ "250010": {
109
+ "content": "▁<extra_id_89>",
110
+ "lstrip": false,
111
+ "normalized": false,
112
+ "rstrip": false,
113
+ "single_word": false,
114
+ "special": false
115
+ },
116
+ "250011": {
117
+ "content": "▁<extra_id_88>",
118
+ "lstrip": false,
119
+ "normalized": false,
120
+ "rstrip": false,
121
+ "single_word": false,
122
+ "special": false
123
+ },
124
+ "250012": {
125
+ "content": "▁<extra_id_87>",
126
+ "lstrip": false,
127
+ "normalized": false,
128
+ "rstrip": false,
129
+ "single_word": false,
130
+ "special": false
131
+ },
132
+ "250013": {
133
+ "content": "▁<extra_id_86>",
134
+ "lstrip": false,
135
+ "normalized": false,
136
+ "rstrip": false,
137
+ "single_word": false,
138
+ "special": false
139
+ },
140
+ "250014": {
141
+ "content": "▁<extra_id_85>",
142
+ "lstrip": false,
143
+ "normalized": false,
144
+ "rstrip": false,
145
+ "single_word": false,
146
+ "special": false
147
+ },
148
+ "250015": {
149
+ "content": "▁<extra_id_84>",
150
+ "lstrip": false,
151
+ "normalized": false,
152
+ "rstrip": false,
153
+ "single_word": false,
154
+ "special": false
155
+ },
156
+ "250016": {
157
+ "content": "▁<extra_id_83>",
158
+ "lstrip": false,
159
+ "normalized": false,
160
+ "rstrip": false,
161
+ "single_word": false,
162
+ "special": false
163
+ },
164
+ "250017": {
165
+ "content": "▁<extra_id_82>",
166
+ "lstrip": false,
167
+ "normalized": false,
168
+ "rstrip": false,
169
+ "single_word": false,
170
+ "special": false
171
+ },
172
+ "250018": {
173
+ "content": "▁<extra_id_81>",
174
+ "lstrip": false,
175
+ "normalized": false,
176
+ "rstrip": false,
177
+ "single_word": false,
178
+ "special": false
179
+ },
180
+ "250019": {
181
+ "content": "▁<extra_id_80>",
182
+ "lstrip": false,
183
+ "normalized": false,
184
+ "rstrip": false,
185
+ "single_word": false,
186
+ "special": false
187
+ },
188
+ "250020": {
189
+ "content": "▁<extra_id_79>",
190
+ "lstrip": false,
191
+ "normalized": false,
192
+ "rstrip": false,
193
+ "single_word": false,
194
+ "special": false
195
+ },
196
+ "250021": {
197
+ "content": "▁<extra_id_78>",
198
+ "lstrip": false,
199
+ "normalized": false,
200
+ "rstrip": false,
201
+ "single_word": false,
202
+ "special": false
203
+ },
204
+ "250022": {
205
+ "content": "▁<extra_id_77>",
206
+ "lstrip": false,
207
+ "normalized": false,
208
+ "rstrip": false,
209
+ "single_word": false,
210
+ "special": false
211
+ },
212
+ "250023": {
213
+ "content": "▁<extra_id_76>",
214
+ "lstrip": false,
215
+ "normalized": false,
216
+ "rstrip": false,
217
+ "single_word": false,
218
+ "special": false
219
+ },
220
+ "250024": {
221
+ "content": "▁<extra_id_75>",
222
+ "lstrip": false,
223
+ "normalized": false,
224
+ "rstrip": false,
225
+ "single_word": false,
226
+ "special": false
227
+ },
228
+ "250025": {
229
+ "content": "▁<extra_id_74>",
230
+ "lstrip": false,
231
+ "normalized": false,
232
+ "rstrip": false,
233
+ "single_word": false,
234
+ "special": false
235
+ },
236
+ "250026": {
237
+ "content": "▁<extra_id_73>",
238
+ "lstrip": false,
239
+ "normalized": false,
240
+ "rstrip": false,
241
+ "single_word": false,
242
+ "special": false
243
+ },
244
+ "250027": {
245
+ "content": "▁<extra_id_72>",
246
+ "lstrip": false,
247
+ "normalized": false,
248
+ "rstrip": false,
249
+ "single_word": false,
250
+ "special": false
251
+ },
252
+ "250028": {
253
+ "content": "▁<extra_id_71>",
254
+ "lstrip": false,
255
+ "normalized": false,
256
+ "rstrip": false,
257
+ "single_word": false,
258
+ "special": false
259
+ },
260
+ "250029": {
261
+ "content": "▁<extra_id_70>",
262
+ "lstrip": false,
263
+ "normalized": false,
264
+ "rstrip": false,
265
+ "single_word": false,
266
+ "special": false
267
+ },
268
+ "250030": {
269
+ "content": "▁<extra_id_69>",
270
+ "lstrip": false,
271
+ "normalized": false,
272
+ "rstrip": false,
273
+ "single_word": false,
274
+ "special": false
275
+ },
276
+ "250031": {
277
+ "content": "▁<extra_id_68>",
278
+ "lstrip": false,
279
+ "normalized": false,
280
+ "rstrip": false,
281
+ "single_word": false,
282
+ "special": false
283
+ },
284
+ "250032": {
285
+ "content": "▁<extra_id_67>",
286
+ "lstrip": false,
287
+ "normalized": false,
288
+ "rstrip": false,
289
+ "single_word": false,
290
+ "special": false
291
+ },
292
+ "250033": {
293
+ "content": "▁<extra_id_66>",
294
+ "lstrip": false,
295
+ "normalized": false,
296
+ "rstrip": false,
297
+ "single_word": false,
298
+ "special": false
299
+ },
300
+ "250034": {
301
+ "content": "▁<extra_id_65>",
302
+ "lstrip": false,
303
+ "normalized": false,
304
+ "rstrip": false,
305
+ "single_word": false,
306
+ "special": false
307
+ },
308
+ "250035": {
309
+ "content": "▁<extra_id_64>",
310
+ "lstrip": false,
311
+ "normalized": false,
312
+ "rstrip": false,
313
+ "single_word": false,
314
+ "special": false
315
+ },
316
+ "250036": {
317
+ "content": "▁<extra_id_63>",
318
+ "lstrip": false,
319
+ "normalized": false,
320
+ "rstrip": false,
321
+ "single_word": false,
322
+ "special": false
323
+ },
324
+ "250037": {
325
+ "content": "▁<extra_id_62>",
326
+ "lstrip": false,
327
+ "normalized": false,
328
+ "rstrip": false,
329
+ "single_word": false,
330
+ "special": false
331
+ },
332
+ "250038": {
333
+ "content": "▁<extra_id_61>",
334
+ "lstrip": false,
335
+ "normalized": false,
336
+ "rstrip": false,
337
+ "single_word": false,
338
+ "special": false
339
+ },
340
+ "250039": {
341
+ "content": "▁<extra_id_60>",
342
+ "lstrip": false,
343
+ "normalized": false,
344
+ "rstrip": false,
345
+ "single_word": false,
346
+ "special": false
347
+ },
348
+ "250040": {
349
+ "content": "▁<extra_id_59>",
350
+ "lstrip": false,
351
+ "normalized": false,
352
+ "rstrip": false,
353
+ "single_word": false,
354
+ "special": false
355
+ },
356
+ "250041": {
357
+ "content": "▁<extra_id_58>",
358
+ "lstrip": false,
359
+ "normalized": false,
360
+ "rstrip": false,
361
+ "single_word": false,
362
+ "special": false
363
+ },
364
+ "250042": {
365
+ "content": "▁<extra_id_57>",
366
+ "lstrip": false,
367
+ "normalized": false,
368
+ "rstrip": false,
369
+ "single_word": false,
370
+ "special": false
371
+ },
372
+ "250043": {
373
+ "content": "▁<extra_id_56>",
374
+ "lstrip": false,
375
+ "normalized": false,
376
+ "rstrip": false,
377
+ "single_word": false,
378
+ "special": false
379
+ },
380
+ "250044": {
381
+ "content": "▁<extra_id_55>",
382
+ "lstrip": false,
383
+ "normalized": false,
384
+ "rstrip": false,
385
+ "single_word": false,
386
+ "special": false
387
+ },
388
+ "250045": {
389
+ "content": "▁<extra_id_54>",
390
+ "lstrip": false,
391
+ "normalized": false,
392
+ "rstrip": false,
393
+ "single_word": false,
394
+ "special": false
395
+ },
396
+ "250046": {
397
+ "content": "▁<extra_id_53>",
398
+ "lstrip": false,
399
+ "normalized": false,
400
+ "rstrip": false,
401
+ "single_word": false,
402
+ "special": false
403
+ },
404
+ "250047": {
405
+ "content": "▁<extra_id_52>",
406
+ "lstrip": false,
407
+ "normalized": false,
408
+ "rstrip": false,
409
+ "single_word": false,
410
+ "special": false
411
+ },
412
+ "250048": {
413
+ "content": "▁<extra_id_51>",
414
+ "lstrip": false,
415
+ "normalized": false,
416
+ "rstrip": false,
417
+ "single_word": false,
418
+ "special": false
419
+ },
420
+ "250049": {
421
+ "content": "▁<extra_id_50>",
422
+ "lstrip": false,
423
+ "normalized": false,
424
+ "rstrip": false,
425
+ "single_word": false,
426
+ "special": false
427
+ },
428
+ "250050": {
429
+ "content": "▁<extra_id_49>",
430
+ "lstrip": false,
431
+ "normalized": false,
432
+ "rstrip": false,
433
+ "single_word": false,
434
+ "special": false
435
+ },
436
+ "250051": {
437
+ "content": "▁<extra_id_48>",
438
+ "lstrip": false,
439
+ "normalized": false,
440
+ "rstrip": false,
441
+ "single_word": false,
442
+ "special": false
443
+ },
444
+ "250052": {
445
+ "content": "▁<extra_id_47>",
446
+ "lstrip": false,
447
+ "normalized": false,
448
+ "rstrip": false,
449
+ "single_word": false,
450
+ "special": false
451
+ },
452
+ "250053": {
453
+ "content": "▁<extra_id_46>",
454
+ "lstrip": false,
455
+ "normalized": false,
456
+ "rstrip": false,
457
+ "single_word": false,
458
+ "special": false
459
+ },
460
+ "250054": {
461
+ "content": "▁<extra_id_45>",
462
+ "lstrip": false,
463
+ "normalized": false,
464
+ "rstrip": false,
465
+ "single_word": false,
466
+ "special": false
467
+ },
468
+ "250055": {
469
+ "content": "▁<extra_id_44>",
470
+ "lstrip": false,
471
+ "normalized": false,
472
+ "rstrip": false,
473
+ "single_word": false,
474
+ "special": false
475
+ },
476
+ "250056": {
477
+ "content": "▁<extra_id_43>",
478
+ "lstrip": false,
479
+ "normalized": false,
480
+ "rstrip": false,
481
+ "single_word": false,
482
+ "special": false
483
+ },
484
+ "250057": {
485
+ "content": "▁<extra_id_42>",
486
+ "lstrip": false,
487
+ "normalized": false,
488
+ "rstrip": false,
489
+ "single_word": false,
490
+ "special": false
491
+ },
492
+ "250058": {
493
+ "content": "▁<extra_id_41>",
494
+ "lstrip": false,
495
+ "normalized": false,
496
+ "rstrip": false,
497
+ "single_word": false,
498
+ "special": false
499
+ },
500
+ "250059": {
501
+ "content": "▁<extra_id_40>",
502
+ "lstrip": false,
503
+ "normalized": false,
504
+ "rstrip": false,
505
+ "single_word": false,
506
+ "special": false
507
+ },
508
+ "250060": {
509
+ "content": "▁<extra_id_39>",
510
+ "lstrip": false,
511
+ "normalized": false,
512
+ "rstrip": false,
513
+ "single_word": false,
514
+ "special": false
515
+ },
516
+ "250061": {
517
+ "content": "▁<extra_id_38>",
518
+ "lstrip": false,
519
+ "normalized": false,
520
+ "rstrip": false,
521
+ "single_word": false,
522
+ "special": false
523
+ },
524
+ "250062": {
525
+ "content": "▁<extra_id_37>",
526
+ "lstrip": false,
527
+ "normalized": false,
528
+ "rstrip": false,
529
+ "single_word": false,
530
+ "special": false
531
+ },
532
+ "250063": {
533
+ "content": "▁<extra_id_36>",
534
+ "lstrip": false,
535
+ "normalized": false,
536
+ "rstrip": false,
537
+ "single_word": false,
538
+ "special": false
539
+ },
540
+ "250064": {
541
+ "content": "▁<extra_id_35>",
542
+ "lstrip": false,
543
+ "normalized": false,
544
+ "rstrip": false,
545
+ "single_word": false,
546
+ "special": false
547
+ },
548
+ "250065": {
549
+ "content": "▁<extra_id_34>",
550
+ "lstrip": false,
551
+ "normalized": false,
552
+ "rstrip": false,
553
+ "single_word": false,
554
+ "special": false
555
+ },
556
+ "250066": {
557
+ "content": "▁<extra_id_33>",
558
+ "lstrip": false,
559
+ "normalized": false,
560
+ "rstrip": false,
561
+ "single_word": false,
562
+ "special": false
563
+ },
564
+ "250067": {
565
+ "content": "▁<extra_id_32>",
566
+ "lstrip": false,
567
+ "normalized": false,
568
+ "rstrip": false,
569
+ "single_word": false,
570
+ "special": false
571
+ },
572
+ "250068": {
573
+ "content": "▁<extra_id_31>",
574
+ "lstrip": false,
575
+ "normalized": false,
576
+ "rstrip": false,
577
+ "single_word": false,
578
+ "special": false
579
+ },
580
+ "250069": {
581
+ "content": "▁<extra_id_30>",
582
+ "lstrip": false,
583
+ "normalized": false,
584
+ "rstrip": false,
585
+ "single_word": false,
586
+ "special": false
587
+ },
588
+ "250070": {
589
+ "content": "▁<extra_id_29>",
590
+ "lstrip": false,
591
+ "normalized": false,
592
+ "rstrip": false,
593
+ "single_word": false,
594
+ "special": false
595
+ },
596
+ "250071": {
597
+ "content": "▁<extra_id_28>",
598
+ "lstrip": false,
599
+ "normalized": false,
600
+ "rstrip": false,
601
+ "single_word": false,
602
+ "special": false
603
+ },
604
+ "250072": {
605
+ "content": "▁<extra_id_27>",
606
+ "lstrip": false,
607
+ "normalized": false,
608
+ "rstrip": false,
609
+ "single_word": false,
610
+ "special": false
611
+ },
612
+ "250073": {
613
+ "content": "▁<extra_id_26>",
614
+ "lstrip": false,
615
+ "normalized": false,
616
+ "rstrip": false,
617
+ "single_word": false,
618
+ "special": false
619
+ },
620
+ "250074": {
621
+ "content": "▁<extra_id_25>",
622
+ "lstrip": false,
623
+ "normalized": false,
624
+ "rstrip": false,
625
+ "single_word": false,
626
+ "special": false
627
+ },
628
+ "250075": {
629
+ "content": "▁<extra_id_24>",
630
+ "lstrip": false,
631
+ "normalized": false,
632
+ "rstrip": false,
633
+ "single_word": false,
634
+ "special": false
635
+ },
636
+ "250076": {
637
+ "content": "▁<extra_id_23>",
638
+ "lstrip": false,
639
+ "normalized": false,
640
+ "rstrip": false,
641
+ "single_word": false,
642
+ "special": false
643
+ },
644
+ "250077": {
645
+ "content": "▁<extra_id_22>",
646
+ "lstrip": false,
647
+ "normalized": false,
648
+ "rstrip": false,
649
+ "single_word": false,
650
+ "special": false
651
+ },
652
+ "250078": {
653
+ "content": "▁<extra_id_21>",
654
+ "lstrip": false,
655
+ "normalized": false,
656
+ "rstrip": false,
657
+ "single_word": false,
658
+ "special": false
659
+ },
660
+ "250079": {
661
+ "content": "▁<extra_id_20>",
662
+ "lstrip": false,
663
+ "normalized": false,
664
+ "rstrip": false,
665
+ "single_word": false,
666
+ "special": false
667
+ },
668
+ "250080": {
669
+ "content": "▁<extra_id_19>",
670
+ "lstrip": false,
671
+ "normalized": false,
672
+ "rstrip": false,
673
+ "single_word": false,
674
+ "special": false
675
+ },
676
+ "250081": {
677
+ "content": "▁<extra_id_18>",
678
+ "lstrip": false,
679
+ "normalized": false,
680
+ "rstrip": false,
681
+ "single_word": false,
682
+ "special": false
683
+ },
684
+ "250082": {
685
+ "content": "▁<extra_id_17>",
686
+ "lstrip": false,
687
+ "normalized": false,
688
+ "rstrip": false,
689
+ "single_word": false,
690
+ "special": false
691
+ },
692
+ "250083": {
693
+ "content": "▁<extra_id_16>",
694
+ "lstrip": false,
695
+ "normalized": false,
696
+ "rstrip": false,
697
+ "single_word": false,
698
+ "special": false
699
+ },
700
+ "250084": {
701
+ "content": "▁<extra_id_15>",
702
+ "lstrip": false,
703
+ "normalized": false,
704
+ "rstrip": false,
705
+ "single_word": false,
706
+ "special": false
707
+ },
708
+ "250085": {
709
+ "content": "▁<extra_id_14>",
710
+ "lstrip": false,
711
+ "normalized": false,
712
+ "rstrip": false,
713
+ "single_word": false,
714
+ "special": false
715
+ },
716
+ "250086": {
717
+ "content": "▁<extra_id_13>",
718
+ "lstrip": false,
719
+ "normalized": false,
720
+ "rstrip": false,
721
+ "single_word": false,
722
+ "special": false
723
+ },
724
+ "250087": {
725
+ "content": "▁<extra_id_12>",
726
+ "lstrip": false,
727
+ "normalized": false,
728
+ "rstrip": false,
729
+ "single_word": false,
730
+ "special": false
731
+ },
732
+ "250088": {
733
+ "content": "▁<extra_id_11>",
734
+ "lstrip": false,
735
+ "normalized": false,
736
+ "rstrip": false,
737
+ "single_word": false,
738
+ "special": false
739
+ },
740
+ "250089": {
741
+ "content": "▁<extra_id_10>",
742
+ "lstrip": false,
743
+ "normalized": false,
744
+ "rstrip": false,
745
+ "single_word": false,
746
+ "special": false
747
+ },
748
+ "250090": {
749
+ "content": "▁<extra_id_9>",
750
+ "lstrip": false,
751
+ "normalized": false,
752
+ "rstrip": false,
753
+ "single_word": false,
754
+ "special": false
755
+ },
756
+ "250091": {
757
+ "content": "▁<extra_id_8>",
758
+ "lstrip": false,
759
+ "normalized": false,
760
+ "rstrip": false,
761
+ "single_word": false,
762
+ "special": false
763
+ },
764
+ "250092": {
765
+ "content": "▁<extra_id_7>",
766
+ "lstrip": false,
767
+ "normalized": false,
768
+ "rstrip": false,
769
+ "single_word": false,
770
+ "special": false
771
+ },
772
+ "250093": {
773
+ "content": "▁<extra_id_6>",
774
+ "lstrip": false,
775
+ "normalized": false,
776
+ "rstrip": false,
777
+ "single_word": false,
778
+ "special": false
779
+ },
780
+ "250094": {
781
+ "content": "▁<extra_id_5>",
782
+ "lstrip": false,
783
+ "normalized": false,
784
+ "rstrip": false,
785
+ "single_word": false,
786
+ "special": false
787
+ },
788
+ "250095": {
789
+ "content": "▁<extra_id_4>",
790
+ "lstrip": false,
791
+ "normalized": false,
792
+ "rstrip": false,
793
+ "single_word": false,
794
+ "special": false
795
+ },
796
+ "250096": {
797
+ "content": "▁<extra_id_3>",
798
+ "lstrip": false,
799
+ "normalized": false,
800
+ "rstrip": false,
801
+ "single_word": false,
802
+ "special": false
803
+ },
804
+ "250097": {
805
+ "content": "▁<extra_id_2>",
806
+ "lstrip": false,
807
+ "normalized": false,
808
+ "rstrip": false,
809
+ "single_word": false,
810
+ "special": false
811
+ },
812
+ "250098": {
813
+ "content": "▁<extra_id_1>",
814
+ "lstrip": false,
815
+ "normalized": false,
816
+ "rstrip": false,
817
+ "single_word": false,
818
+ "special": false
819
+ },
820
+ "250099": {
821
+ "content": "▁<extra_id_0>",
822
+ "lstrip": false,
823
+ "normalized": false,
824
+ "rstrip": false,
825
+ "single_word": false,
826
+ "special": false
827
+ }
828
+ },
829
+ "additional_special_tokens": [],
830
+ "clean_up_tokenization_spaces": false,
831
+ "eos_token": "</s>",
832
+ "extra_ids": 0,
833
+ "extra_special_tokens": {},
834
+ "legacy": false,
835
+ "model_max_length": 1000000000000000019884624838656,
836
+ "pad_token": "<pad>",
837
+ "sp_model_kwargs": {},
838
+ "tokenizer_class": "T5Tokenizer",
839
+ "unk_token": "<unk>"
840
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7481c2a5713cb162550b5f02d01415cbac1cb36a3ac1c71b15a86943d7e579ce
3
+ size 5496