gpol13 committed on
Commit
3d6deb7
·
verified ·
1 Parent(s): 70116e4

Upload folder using huggingface_hub

Browse files
README.md CHANGED
@@ -199,4 +199,4 @@ Carbon emissions can be estimated using the [Machine Learning Impact calculator]
199
  [More Information Needed]
200
  ### Framework versions
201
 
202
- - PEFT 0.14.0
 
199
  [More Information Needed]
200
  ### Framework versions
201
 
202
+ - PEFT 0.12.0
adapter_config.json CHANGED
@@ -3,18 +3,15 @@
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "Salesforce/codet5-base",
5
  "bias": "none",
6
- "eva_config": null,
7
- "exclude_modules": null,
8
  "fan_in_fan_out": false,
9
  "inference_mode": true,
10
- "init_lora_weights": "gaussian",
11
  "layer_replication": null,
12
  "layers_pattern": null,
13
  "layers_to_transform": null,
14
  "loftq_config": {},
15
  "lora_alpha": 16,
16
- "lora_bias": false,
17
- "lora_dropout": 0.05,
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
20
  "modules_to_save": null,
@@ -23,8 +20,10 @@
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
 
 
26
  "q",
27
- "v"
28
  ],
29
  "task_type": "SEQ_2_SEQ_LM",
30
  "use_dora": false,
 
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "Salesforce/codet5-base",
5
  "bias": "none",
 
 
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
8
+ "init_lora_weights": true,
9
  "layer_replication": null,
10
  "layers_pattern": null,
11
  "layers_to_transform": null,
12
  "loftq_config": {},
13
  "lora_alpha": 16,
14
+ "lora_dropout": 0.1,
 
15
  "megatron_config": null,
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": null,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "o",
24
+ "v",
25
  "q",
26
+ "k"
27
  ],
28
  "task_type": "SEQ_2_SEQ_LM",
29
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d8b59853002c861613dfba51f1fbd432af1cf3e216a526b636e631933f3c2439
3
- size 3558888
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07c922d4b9b4865f0895cf70990c49e7458cb3c5ac4e1b5b0b72a774b7514d4b
3
+ size 7117824
checkpoint-9213/README.md ADDED
@@ -0,0 +1,202 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: Salesforce/codet5-base
3
+ library_name: peft
4
+ ---
5
+
6
+ # Model Card for Model ID
7
+
8
+ <!-- Provide a quick summary of what the model is/does. -->
9
+
10
+
11
+
12
+ ## Model Details
13
+
14
+ ### Model Description
15
+
16
+ <!-- Provide a longer summary of what this model is. -->
17
+
18
+
19
+
20
+ - **Developed by:** [More Information Needed]
21
+ - **Funded by [optional]:** [More Information Needed]
22
+ - **Shared by [optional]:** [More Information Needed]
23
+ - **Model type:** [More Information Needed]
24
+ - **Language(s) (NLP):** [More Information Needed]
25
+ - **License:** [More Information Needed]
26
+ - **Finetuned from model [optional]:** [More Information Needed]
27
+
28
+ ### Model Sources [optional]
29
+
30
+ <!-- Provide the basic links for the model. -->
31
+
32
+ - **Repository:** [More Information Needed]
33
+ - **Paper [optional]:** [More Information Needed]
34
+ - **Demo [optional]:** [More Information Needed]
35
+
36
+ ## Uses
37
+
38
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
39
+
40
+ ### Direct Use
41
+
42
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
43
+
44
+ [More Information Needed]
45
+
46
+ ### Downstream Use [optional]
47
+
48
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
49
+
50
+ [More Information Needed]
51
+
52
+ ### Out-of-Scope Use
53
+
54
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
55
+
56
+ [More Information Needed]
57
+
58
+ ## Bias, Risks, and Limitations
59
+
60
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
61
+
62
+ [More Information Needed]
63
+
64
+ ### Recommendations
65
+
66
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
67
+
68
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
69
+
70
+ ## How to Get Started with the Model
71
+
72
+ Use the code below to get started with the model.
73
+
74
+ [More Information Needed]
75
+
76
+ ## Training Details
77
+
78
+ ### Training Data
79
+
80
+ <!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
81
+
82
+ [More Information Needed]
83
+
84
+ ### Training Procedure
85
+
86
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
87
+
88
+ #### Preprocessing [optional]
89
+
90
+ [More Information Needed]
91
+
92
+
93
+ #### Training Hyperparameters
94
+
95
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
96
+
97
+ #### Speeds, Sizes, Times [optional]
98
+
99
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
100
+
101
+ [More Information Needed]
102
+
103
+ ## Evaluation
104
+
105
+ <!-- This section describes the evaluation protocols and provides the results. -->
106
+
107
+ ### Testing Data, Factors & Metrics
108
+
109
+ #### Testing Data
110
+
111
+ <!-- This should link to a Dataset Card if possible. -->
112
+
113
+ [More Information Needed]
114
+
115
+ #### Factors
116
+
117
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
118
+
119
+ [More Information Needed]
120
+
121
+ #### Metrics
122
+
123
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
124
+
125
+ [More Information Needed]
126
+
127
+ ### Results
128
+
129
+ [More Information Needed]
130
+
131
+ #### Summary
132
+
133
+
134
+
135
+ ## Model Examination [optional]
136
+
137
+ <!-- Relevant interpretability work for the model goes here -->
138
+
139
+ [More Information Needed]
140
+
141
+ ## Environmental Impact
142
+
143
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
144
+
145
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
146
+
147
+ - **Hardware Type:** [More Information Needed]
148
+ - **Hours used:** [More Information Needed]
149
+ - **Cloud Provider:** [More Information Needed]
150
+ - **Compute Region:** [More Information Needed]
151
+ - **Carbon Emitted:** [More Information Needed]
152
+
153
+ ## Technical Specifications [optional]
154
+
155
+ ### Model Architecture and Objective
156
+
157
+ [More Information Needed]
158
+
159
+ ### Compute Infrastructure
160
+
161
+ [More Information Needed]
162
+
163
+ #### Hardware
164
+
165
+ [More Information Needed]
166
+
167
+ #### Software
168
+
169
+ [More Information Needed]
170
+
171
+ ## Citation [optional]
172
+
173
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
174
+
175
+ **BibTeX:**
176
+
177
+ [More Information Needed]
178
+
179
+ **APA:**
180
+
181
+ [More Information Needed]
182
+
183
+ ## Glossary [optional]
184
+
185
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
186
+
187
+ [More Information Needed]
188
+
189
+ ## More Information [optional]
190
+
191
+ [More Information Needed]
192
+
193
+ ## Model Card Authors [optional]
194
+
195
+ [More Information Needed]
196
+
197
+ ## Model Card Contact
198
+
199
+ [More Information Needed]
200
+ ### Framework versions
201
+
202
+ - PEFT 0.12.0
checkpoint-9213/adapter_config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": null,
4
+ "base_model_name_or_path": "Salesforce/codet5-base",
5
+ "bias": "none",
6
+ "fan_in_fan_out": false,
7
+ "inference_mode": true,
8
+ "init_lora_weights": true,
9
+ "layer_replication": null,
10
+ "layers_pattern": null,
11
+ "layers_to_transform": null,
12
+ "loftq_config": {},
13
+ "lora_alpha": 16,
14
+ "lora_dropout": 0.1,
15
+ "megatron_config": null,
16
+ "megatron_core": "megatron.core",
17
+ "modules_to_save": null,
18
+ "peft_type": "LORA",
19
+ "r": 8,
20
+ "rank_pattern": {},
21
+ "revision": null,
22
+ "target_modules": [
23
+ "o",
24
+ "v",
25
+ "q",
26
+ "k"
27
+ ],
28
+ "task_type": "SEQ_2_SEQ_LM",
29
+ "use_dora": false,
30
+ "use_rslora": false
31
+ }
checkpoint-9213/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07c922d4b9b4865f0895cf70990c49e7458cb3c5ac4e1b5b0b72a774b7514d4b
3
+ size 7117824
checkpoint-9213/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8697ac1d3dba5f15118a269ae29435a8fbe2ace44928ccfb9668f1c1effd0a86
3
+ size 14397434
checkpoint-9213/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be754dba0c3662c12f8b07c5fd72ef60160e13708e25173bb6b57ab26d1fc1b8
3
+ size 14244
checkpoint-9213/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c3840dc5bc85d985597878966f3c7b1f7ee99e5918ecbab8150afe4175ab029
3
+ size 1064
checkpoint-9213/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-9213/tokenizer_config.json ADDED
@@ -0,0 +1,719 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "additional_special_tokens": [
4
+ {
5
+ "content": "<extra_id_99>",
6
+ "lstrip": true,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false
10
+ },
11
+ {
12
+ "content": "<extra_id_98>",
13
+ "lstrip": true,
14
+ "normalized": true,
15
+ "rstrip": false,
16
+ "single_word": false
17
+ },
18
+ {
19
+ "content": "<extra_id_97>",
20
+ "lstrip": true,
21
+ "normalized": true,
22
+ "rstrip": false,
23
+ "single_word": false
24
+ },
25
+ {
26
+ "content": "<extra_id_96>",
27
+ "lstrip": true,
28
+ "normalized": true,
29
+ "rstrip": false,
30
+ "single_word": false
31
+ },
32
+ {
33
+ "content": "<extra_id_95>",
34
+ "lstrip": true,
35
+ "normalized": true,
36
+ "rstrip": false,
37
+ "single_word": false
38
+ },
39
+ {
40
+ "content": "<extra_id_94>",
41
+ "lstrip": true,
42
+ "normalized": true,
43
+ "rstrip": false,
44
+ "single_word": false
45
+ },
46
+ {
47
+ "content": "<extra_id_93>",
48
+ "lstrip": true,
49
+ "normalized": true,
50
+ "rstrip": false,
51
+ "single_word": false
52
+ },
53
+ {
54
+ "content": "<extra_id_92>",
55
+ "lstrip": true,
56
+ "normalized": true,
57
+ "rstrip": false,
58
+ "single_word": false
59
+ },
60
+ {
61
+ "content": "<extra_id_91>",
62
+ "lstrip": true,
63
+ "normalized": true,
64
+ "rstrip": false,
65
+ "single_word": false
66
+ },
67
+ {
68
+ "content": "<extra_id_90>",
69
+ "lstrip": true,
70
+ "normalized": true,
71
+ "rstrip": false,
72
+ "single_word": false
73
+ },
74
+ {
75
+ "content": "<extra_id_89>",
76
+ "lstrip": true,
77
+ "normalized": true,
78
+ "rstrip": false,
79
+ "single_word": false
80
+ },
81
+ {
82
+ "content": "<extra_id_88>",
83
+ "lstrip": true,
84
+ "normalized": true,
85
+ "rstrip": false,
86
+ "single_word": false
87
+ },
88
+ {
89
+ "content": "<extra_id_87>",
90
+ "lstrip": true,
91
+ "normalized": true,
92
+ "rstrip": false,
93
+ "single_word": false
94
+ },
95
+ {
96
+ "content": "<extra_id_86>",
97
+ "lstrip": true,
98
+ "normalized": true,
99
+ "rstrip": false,
100
+ "single_word": false
101
+ },
102
+ {
103
+ "content": "<extra_id_85>",
104
+ "lstrip": true,
105
+ "normalized": true,
106
+ "rstrip": false,
107
+ "single_word": false
108
+ },
109
+ {
110
+ "content": "<extra_id_84>",
111
+ "lstrip": true,
112
+ "normalized": true,
113
+ "rstrip": false,
114
+ "single_word": false
115
+ },
116
+ {
117
+ "content": "<extra_id_83>",
118
+ "lstrip": true,
119
+ "normalized": true,
120
+ "rstrip": false,
121
+ "single_word": false
122
+ },
123
+ {
124
+ "content": "<extra_id_82>",
125
+ "lstrip": true,
126
+ "normalized": true,
127
+ "rstrip": false,
128
+ "single_word": false
129
+ },
130
+ {
131
+ "content": "<extra_id_81>",
132
+ "lstrip": true,
133
+ "normalized": true,
134
+ "rstrip": false,
135
+ "single_word": false
136
+ },
137
+ {
138
+ "content": "<extra_id_80>",
139
+ "lstrip": true,
140
+ "normalized": true,
141
+ "rstrip": false,
142
+ "single_word": false
143
+ },
144
+ {
145
+ "content": "<extra_id_79>",
146
+ "lstrip": true,
147
+ "normalized": true,
148
+ "rstrip": false,
149
+ "single_word": false
150
+ },
151
+ {
152
+ "content": "<extra_id_78>",
153
+ "lstrip": true,
154
+ "normalized": true,
155
+ "rstrip": false,
156
+ "single_word": false
157
+ },
158
+ {
159
+ "content": "<extra_id_77>",
160
+ "lstrip": true,
161
+ "normalized": true,
162
+ "rstrip": false,
163
+ "single_word": false
164
+ },
165
+ {
166
+ "content": "<extra_id_76>",
167
+ "lstrip": true,
168
+ "normalized": true,
169
+ "rstrip": false,
170
+ "single_word": false
171
+ },
172
+ {
173
+ "content": "<extra_id_75>",
174
+ "lstrip": true,
175
+ "normalized": true,
176
+ "rstrip": false,
177
+ "single_word": false
178
+ },
179
+ {
180
+ "content": "<extra_id_74>",
181
+ "lstrip": true,
182
+ "normalized": true,
183
+ "rstrip": false,
184
+ "single_word": false
185
+ },
186
+ {
187
+ "content": "<extra_id_73>",
188
+ "lstrip": true,
189
+ "normalized": true,
190
+ "rstrip": false,
191
+ "single_word": false
192
+ },
193
+ {
194
+ "content": "<extra_id_72>",
195
+ "lstrip": true,
196
+ "normalized": true,
197
+ "rstrip": false,
198
+ "single_word": false
199
+ },
200
+ {
201
+ "content": "<extra_id_71>",
202
+ "lstrip": true,
203
+ "normalized": true,
204
+ "rstrip": false,
205
+ "single_word": false
206
+ },
207
+ {
208
+ "content": "<extra_id_70>",
209
+ "lstrip": true,
210
+ "normalized": true,
211
+ "rstrip": false,
212
+ "single_word": false
213
+ },
214
+ {
215
+ "content": "<extra_id_69>",
216
+ "lstrip": true,
217
+ "normalized": true,
218
+ "rstrip": false,
219
+ "single_word": false
220
+ },
221
+ {
222
+ "content": "<extra_id_68>",
223
+ "lstrip": true,
224
+ "normalized": true,
225
+ "rstrip": false,
226
+ "single_word": false
227
+ },
228
+ {
229
+ "content": "<extra_id_67>",
230
+ "lstrip": true,
231
+ "normalized": true,
232
+ "rstrip": false,
233
+ "single_word": false
234
+ },
235
+ {
236
+ "content": "<extra_id_66>",
237
+ "lstrip": true,
238
+ "normalized": true,
239
+ "rstrip": false,
240
+ "single_word": false
241
+ },
242
+ {
243
+ "content": "<extra_id_65>",
244
+ "lstrip": true,
245
+ "normalized": true,
246
+ "rstrip": false,
247
+ "single_word": false
248
+ },
249
+ {
250
+ "content": "<extra_id_64>",
251
+ "lstrip": true,
252
+ "normalized": true,
253
+ "rstrip": false,
254
+ "single_word": false
255
+ },
256
+ {
257
+ "content": "<extra_id_63>",
258
+ "lstrip": true,
259
+ "normalized": true,
260
+ "rstrip": false,
261
+ "single_word": false
262
+ },
263
+ {
264
+ "content": "<extra_id_62>",
265
+ "lstrip": true,
266
+ "normalized": true,
267
+ "rstrip": false,
268
+ "single_word": false
269
+ },
270
+ {
271
+ "content": "<extra_id_61>",
272
+ "lstrip": true,
273
+ "normalized": true,
274
+ "rstrip": false,
275
+ "single_word": false
276
+ },
277
+ {
278
+ "content": "<extra_id_60>",
279
+ "lstrip": true,
280
+ "normalized": true,
281
+ "rstrip": false,
282
+ "single_word": false
283
+ },
284
+ {
285
+ "content": "<extra_id_59>",
286
+ "lstrip": true,
287
+ "normalized": true,
288
+ "rstrip": false,
289
+ "single_word": false
290
+ },
291
+ {
292
+ "content": "<extra_id_58>",
293
+ "lstrip": true,
294
+ "normalized": true,
295
+ "rstrip": false,
296
+ "single_word": false
297
+ },
298
+ {
299
+ "content": "<extra_id_57>",
300
+ "lstrip": true,
301
+ "normalized": true,
302
+ "rstrip": false,
303
+ "single_word": false
304
+ },
305
+ {
306
+ "content": "<extra_id_56>",
307
+ "lstrip": true,
308
+ "normalized": true,
309
+ "rstrip": false,
310
+ "single_word": false
311
+ },
312
+ {
313
+ "content": "<extra_id_55>",
314
+ "lstrip": true,
315
+ "normalized": true,
316
+ "rstrip": false,
317
+ "single_word": false
318
+ },
319
+ {
320
+ "content": "<extra_id_54>",
321
+ "lstrip": true,
322
+ "normalized": true,
323
+ "rstrip": false,
324
+ "single_word": false
325
+ },
326
+ {
327
+ "content": "<extra_id_53>",
328
+ "lstrip": true,
329
+ "normalized": true,
330
+ "rstrip": false,
331
+ "single_word": false
332
+ },
333
+ {
334
+ "content": "<extra_id_52>",
335
+ "lstrip": true,
336
+ "normalized": true,
337
+ "rstrip": false,
338
+ "single_word": false
339
+ },
340
+ {
341
+ "content": "<extra_id_51>",
342
+ "lstrip": true,
343
+ "normalized": true,
344
+ "rstrip": false,
345
+ "single_word": false
346
+ },
347
+ {
348
+ "content": "<extra_id_50>",
349
+ "lstrip": true,
350
+ "normalized": true,
351
+ "rstrip": false,
352
+ "single_word": false
353
+ },
354
+ {
355
+ "content": "<extra_id_49>",
356
+ "lstrip": true,
357
+ "normalized": true,
358
+ "rstrip": false,
359
+ "single_word": false
360
+ },
361
+ {
362
+ "content": "<extra_id_48>",
363
+ "lstrip": true,
364
+ "normalized": true,
365
+ "rstrip": false,
366
+ "single_word": false
367
+ },
368
+ {
369
+ "content": "<extra_id_47>",
370
+ "lstrip": true,
371
+ "normalized": true,
372
+ "rstrip": false,
373
+ "single_word": false
374
+ },
375
+ {
376
+ "content": "<extra_id_46>",
377
+ "lstrip": true,
378
+ "normalized": true,
379
+ "rstrip": false,
380
+ "single_word": false
381
+ },
382
+ {
383
+ "content": "<extra_id_45>",
384
+ "lstrip": true,
385
+ "normalized": true,
386
+ "rstrip": false,
387
+ "single_word": false
388
+ },
389
+ {
390
+ "content": "<extra_id_44>",
391
+ "lstrip": true,
392
+ "normalized": true,
393
+ "rstrip": false,
394
+ "single_word": false
395
+ },
396
+ {
397
+ "content": "<extra_id_43>",
398
+ "lstrip": true,
399
+ "normalized": true,
400
+ "rstrip": false,
401
+ "single_word": false
402
+ },
403
+ {
404
+ "content": "<extra_id_42>",
405
+ "lstrip": true,
406
+ "normalized": true,
407
+ "rstrip": false,
408
+ "single_word": false
409
+ },
410
+ {
411
+ "content": "<extra_id_41>",
412
+ "lstrip": true,
413
+ "normalized": true,
414
+ "rstrip": false,
415
+ "single_word": false
416
+ },
417
+ {
418
+ "content": "<extra_id_40>",
419
+ "lstrip": true,
420
+ "normalized": true,
421
+ "rstrip": false,
422
+ "single_word": false
423
+ },
424
+ {
425
+ "content": "<extra_id_39>",
426
+ "lstrip": true,
427
+ "normalized": true,
428
+ "rstrip": false,
429
+ "single_word": false
430
+ },
431
+ {
432
+ "content": "<extra_id_38>",
433
+ "lstrip": true,
434
+ "normalized": true,
435
+ "rstrip": false,
436
+ "single_word": false
437
+ },
438
+ {
439
+ "content": "<extra_id_37>",
440
+ "lstrip": true,
441
+ "normalized": true,
442
+ "rstrip": false,
443
+ "single_word": false
444
+ },
445
+ {
446
+ "content": "<extra_id_36>",
447
+ "lstrip": true,
448
+ "normalized": true,
449
+ "rstrip": false,
450
+ "single_word": false
451
+ },
452
+ {
453
+ "content": "<extra_id_35>",
454
+ "lstrip": true,
455
+ "normalized": true,
456
+ "rstrip": false,
457
+ "single_word": false
458
+ },
459
+ {
460
+ "content": "<extra_id_34>",
461
+ "lstrip": true,
462
+ "normalized": true,
463
+ "rstrip": false,
464
+ "single_word": false
465
+ },
466
+ {
467
+ "content": "<extra_id_33>",
468
+ "lstrip": true,
469
+ "normalized": true,
470
+ "rstrip": false,
471
+ "single_word": false
472
+ },
473
+ {
474
+ "content": "<extra_id_32>",
475
+ "lstrip": true,
476
+ "normalized": true,
477
+ "rstrip": false,
478
+ "single_word": false
479
+ },
480
+ {
481
+ "content": "<extra_id_31>",
482
+ "lstrip": true,
483
+ "normalized": true,
484
+ "rstrip": false,
485
+ "single_word": false
486
+ },
487
+ {
488
+ "content": "<extra_id_30>",
489
+ "lstrip": true,
490
+ "normalized": true,
491
+ "rstrip": false,
492
+ "single_word": false
493
+ },
494
+ {
495
+ "content": "<extra_id_29>",
496
+ "lstrip": true,
497
+ "normalized": true,
498
+ "rstrip": false,
499
+ "single_word": false
500
+ },
501
+ {
502
+ "content": "<extra_id_28>",
503
+ "lstrip": true,
504
+ "normalized": true,
505
+ "rstrip": false,
506
+ "single_word": false
507
+ },
508
+ {
509
+ "content": "<extra_id_27>",
510
+ "lstrip": true,
511
+ "normalized": true,
512
+ "rstrip": false,
513
+ "single_word": false
514
+ },
515
+ {
516
+ "content": "<extra_id_26>",
517
+ "lstrip": true,
518
+ "normalized": true,
519
+ "rstrip": false,
520
+ "single_word": false
521
+ },
522
+ {
523
+ "content": "<extra_id_25>",
524
+ "lstrip": true,
525
+ "normalized": true,
526
+ "rstrip": false,
527
+ "single_word": false
528
+ },
529
+ {
530
+ "content": "<extra_id_24>",
531
+ "lstrip": true,
532
+ "normalized": true,
533
+ "rstrip": false,
534
+ "single_word": false
535
+ },
536
+ {
537
+ "content": "<extra_id_23>",
538
+ "lstrip": true,
539
+ "normalized": true,
540
+ "rstrip": false,
541
+ "single_word": false
542
+ },
543
+ {
544
+ "content": "<extra_id_22>",
545
+ "lstrip": true,
546
+ "normalized": true,
547
+ "rstrip": false,
548
+ "single_word": false
549
+ },
550
+ {
551
+ "content": "<extra_id_21>",
552
+ "lstrip": true,
553
+ "normalized": true,
554
+ "rstrip": false,
555
+ "single_word": false
556
+ },
557
+ {
558
+ "content": "<extra_id_20>",
559
+ "lstrip": true,
560
+ "normalized": true,
561
+ "rstrip": false,
562
+ "single_word": false
563
+ },
564
+ {
565
+ "content": "<extra_id_19>",
566
+ "lstrip": true,
567
+ "normalized": true,
568
+ "rstrip": false,
569
+ "single_word": false
570
+ },
571
+ {
572
+ "content": "<extra_id_18>",
573
+ "lstrip": true,
574
+ "normalized": true,
575
+ "rstrip": false,
576
+ "single_word": false
577
+ },
578
+ {
579
+ "content": "<extra_id_17>",
580
+ "lstrip": true,
581
+ "normalized": true,
582
+ "rstrip": false,
583
+ "single_word": false
584
+ },
585
+ {
586
+ "content": "<extra_id_16>",
587
+ "lstrip": true,
588
+ "normalized": true,
589
+ "rstrip": false,
590
+ "single_word": false
591
+ },
592
+ {
593
+ "content": "<extra_id_15>",
594
+ "lstrip": true,
595
+ "normalized": true,
596
+ "rstrip": false,
597
+ "single_word": false
598
+ },
599
+ {
600
+ "content": "<extra_id_14>",
601
+ "lstrip": true,
602
+ "normalized": true,
603
+ "rstrip": false,
604
+ "single_word": false
605
+ },
606
+ {
607
+ "content": "<extra_id_13>",
608
+ "lstrip": true,
609
+ "normalized": true,
610
+ "rstrip": false,
611
+ "single_word": false
612
+ },
613
+ {
614
+ "content": "<extra_id_12>",
615
+ "lstrip": true,
616
+ "normalized": true,
617
+ "rstrip": false,
618
+ "single_word": false
619
+ },
620
+ {
621
+ "content": "<extra_id_11>",
622
+ "lstrip": true,
623
+ "normalized": true,
624
+ "rstrip": false,
625
+ "single_word": false
626
+ },
627
+ {
628
+ "content": "<extra_id_10>",
629
+ "lstrip": true,
630
+ "normalized": true,
631
+ "rstrip": false,
632
+ "single_word": false
633
+ },
634
+ {
635
+ "content": "<extra_id_9>",
636
+ "lstrip": true,
637
+ "normalized": true,
638
+ "rstrip": false,
639
+ "single_word": false
640
+ },
641
+ {
642
+ "content": "<extra_id_8>",
643
+ "lstrip": true,
644
+ "normalized": true,
645
+ "rstrip": false,
646
+ "single_word": false
647
+ },
648
+ {
649
+ "content": "<extra_id_7>",
650
+ "lstrip": true,
651
+ "normalized": true,
652
+ "rstrip": false,
653
+ "single_word": false
654
+ },
655
+ {
656
+ "content": "<extra_id_6>",
657
+ "lstrip": true,
658
+ "normalized": true,
659
+ "rstrip": false,
660
+ "single_word": false
661
+ },
662
+ {
663
+ "content": "<extra_id_5>",
664
+ "lstrip": true,
665
+ "normalized": true,
666
+ "rstrip": false,
667
+ "single_word": false
668
+ },
669
+ {
670
+ "content": "<extra_id_4>",
671
+ "lstrip": true,
672
+ "normalized": true,
673
+ "rstrip": false,
674
+ "single_word": false
675
+ },
676
+ {
677
+ "content": "<extra_id_3>",
678
+ "lstrip": true,
679
+ "normalized": true,
680
+ "rstrip": false,
681
+ "single_word": false
682
+ },
683
+ {
684
+ "content": "<extra_id_2>",
685
+ "lstrip": true,
686
+ "normalized": true,
687
+ "rstrip": false,
688
+ "single_word": false
689
+ },
690
+ {
691
+ "content": "<extra_id_1>",
692
+ "lstrip": true,
693
+ "normalized": true,
694
+ "rstrip": false,
695
+ "single_word": false
696
+ },
697
+ {
698
+ "content": "<extra_id_0>",
699
+ "lstrip": true,
700
+ "normalized": true,
701
+ "rstrip": false,
702
+ "single_word": false
703
+ }
704
+ ],
705
+ "backend": "tokenizers",
706
+ "bos_token": "<s>",
707
+ "cls_token": "<s>",
708
+ "eos_token": "</s>",
709
+ "errors": "replace",
710
+ "extra_special_tokens": [],
711
+ "is_local": false,
712
+ "mask_token": "<mask>",
713
+ "model_max_length": 512,
714
+ "pad_token": "<pad>",
715
+ "sep_token": "</s>",
716
+ "tokenizer_class": "RobertaTokenizer",
717
+ "trim_offsets": true,
718
+ "unk_token": "<unk>"
719
+ }
checkpoint-9213/trainer_state.json ADDED
@@ -0,0 +1,1361 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 3.0,
6
+ "eval_steps": 500,
7
+ "global_step": 9213,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.0162813415825464,
14
+ "grad_norm": 1.3991888761520386,
15
+ "learning_rate": 4.973407142081841e-05,
16
+ "loss": 4.4039175415039065,
17
+ "step": 50
18
+ },
19
+ {
20
+ "epoch": 0.0325626831650928,
21
+ "grad_norm": 2.573707342147827,
22
+ "learning_rate": 4.946271572777597e-05,
23
+ "loss": 3.261125183105469,
24
+ "step": 100
25
+ },
26
+ {
27
+ "epoch": 0.04884402474763921,
28
+ "grad_norm": 1.1588261127471924,
29
+ "learning_rate": 4.919136003473353e-05,
30
+ "loss": 2.1376600646972657,
31
+ "step": 150
32
+ },
33
+ {
34
+ "epoch": 0.0651253663301856,
35
+ "grad_norm": 1.4137802124023438,
36
+ "learning_rate": 4.892000434169109e-05,
37
+ "loss": 1.8963032531738282,
38
+ "step": 200
39
+ },
40
+ {
41
+ "epoch": 0.08140670791273201,
42
+ "grad_norm": 1.9414198398590088,
43
+ "learning_rate": 4.8648648648648654e-05,
44
+ "loss": 1.8314729309082032,
45
+ "step": 250
46
+ },
47
+ {
48
+ "epoch": 0.09768804949527841,
49
+ "grad_norm": 1.4838837385177612,
50
+ "learning_rate": 4.837729295560621e-05,
51
+ "loss": 1.7229083251953126,
52
+ "step": 300
53
+ },
54
+ {
55
+ "epoch": 0.11396939107782482,
56
+ "grad_norm": 1.7064085006713867,
57
+ "learning_rate": 4.810593726256377e-05,
58
+ "loss": 1.6793362426757812,
59
+ "step": 350
60
+ },
61
+ {
62
+ "epoch": 0.1302507326603712,
63
+ "grad_norm": 1.4688920974731445,
64
+ "learning_rate": 4.783458156952133e-05,
65
+ "loss": 1.598350067138672,
66
+ "step": 400
67
+ },
68
+ {
69
+ "epoch": 0.14653207424291761,
70
+ "grad_norm": 1.336400032043457,
71
+ "learning_rate": 4.756322587647889e-05,
72
+ "loss": 1.5864486694335938,
73
+ "step": 450
74
+ },
75
+ {
76
+ "epoch": 0.16281341582546402,
77
+ "grad_norm": 1.780544638633728,
78
+ "learning_rate": 4.729187018343645e-05,
79
+ "loss": 1.4491355895996094,
80
+ "step": 500
81
+ },
82
+ {
83
+ "epoch": 0.17909475740801042,
84
+ "grad_norm": 1.9979498386383057,
85
+ "learning_rate": 4.7020514490394014e-05,
86
+ "loss": 1.508986358642578,
87
+ "step": 550
88
+ },
89
+ {
90
+ "epoch": 0.19537609899055683,
91
+ "grad_norm": 2.582775115966797,
92
+ "learning_rate": 4.674915879735157e-05,
93
+ "loss": 1.3531187438964845,
94
+ "step": 600
95
+ },
96
+ {
97
+ "epoch": 0.21165744057310323,
98
+ "grad_norm": 1.9345420598983765,
99
+ "learning_rate": 4.647780310430913e-05,
100
+ "loss": 1.3679487609863281,
101
+ "step": 650
102
+ },
103
+ {
104
+ "epoch": 0.22793878215564964,
105
+ "grad_norm": 1.9719504117965698,
106
+ "learning_rate": 4.620644741126669e-05,
107
+ "loss": 1.324554443359375,
108
+ "step": 700
109
+ },
110
+ {
111
+ "epoch": 0.24422012373819602,
112
+ "grad_norm": 1.7349779605865479,
113
+ "learning_rate": 4.593509171822425e-05,
114
+ "loss": 1.2080127716064453,
115
+ "step": 750
116
+ },
117
+ {
118
+ "epoch": 0.2605014653207424,
119
+ "grad_norm": 2.53094482421875,
120
+ "learning_rate": 4.566373602518181e-05,
121
+ "loss": 1.219000244140625,
122
+ "step": 800
123
+ },
124
+ {
125
+ "epoch": 0.2767828069032888,
126
+ "grad_norm": 2.5429346561431885,
127
+ "learning_rate": 4.5392380332139374e-05,
128
+ "loss": 1.263201675415039,
129
+ "step": 850
130
+ },
131
+ {
132
+ "epoch": 0.29306414848583523,
133
+ "grad_norm": 2.447312831878662,
134
+ "learning_rate": 4.512102463909693e-05,
135
+ "loss": 1.1299581146240234,
136
+ "step": 900
137
+ },
138
+ {
139
+ "epoch": 0.30934549006838163,
140
+ "grad_norm": 2.299469470977783,
141
+ "learning_rate": 4.484966894605449e-05,
142
+ "loss": 1.1863082122802735,
143
+ "step": 950
144
+ },
145
+ {
146
+ "epoch": 0.32562683165092804,
147
+ "grad_norm": 2.7745773792266846,
148
+ "learning_rate": 4.457831325301205e-05,
149
+ "loss": 1.1487353515625,
150
+ "step": 1000
151
+ },
152
+ {
153
+ "epoch": 0.34190817323347444,
154
+ "grad_norm": 2.7474420070648193,
155
+ "learning_rate": 4.430695755996961e-05,
156
+ "loss": 1.1214525604248047,
157
+ "step": 1050
158
+ },
159
+ {
160
+ "epoch": 0.35818951481602085,
161
+ "grad_norm": 2.597487211227417,
162
+ "learning_rate": 4.403560186692717e-05,
163
+ "loss": 1.0956230163574219,
164
+ "step": 1100
165
+ },
166
+ {
167
+ "epoch": 0.37447085639856725,
168
+ "grad_norm": 2.393484354019165,
169
+ "learning_rate": 4.3764246173884733e-05,
170
+ "loss": 1.0677281951904296,
171
+ "step": 1150
172
+ },
173
+ {
174
+ "epoch": 0.39075219798111366,
175
+ "grad_norm": 2.6319406032562256,
176
+ "learning_rate": 4.349289048084229e-05,
177
+ "loss": 1.0166962432861328,
178
+ "step": 1200
179
+ },
180
+ {
181
+ "epoch": 0.40703353956366006,
182
+ "grad_norm": 2.9170615673065186,
183
+ "learning_rate": 4.322153478779985e-05,
184
+ "loss": 0.9722758483886719,
185
+ "step": 1250
186
+ },
187
+ {
188
+ "epoch": 0.42331488114620647,
189
+ "grad_norm": 3.030376672744751,
190
+ "learning_rate": 4.295017909475741e-05,
191
+ "loss": 0.9831496429443359,
192
+ "step": 1300
193
+ },
194
+ {
195
+ "epoch": 0.4395962227287529,
196
+ "grad_norm": 1.9566906690597534,
197
+ "learning_rate": 4.267882340171497e-05,
198
+ "loss": 1.0231520080566405,
199
+ "step": 1350
200
+ },
201
+ {
202
+ "epoch": 0.4558775643112993,
203
+ "grad_norm": 3.1707541942596436,
204
+ "learning_rate": 4.2407467708672534e-05,
205
+ "loss": 0.9151640319824219,
206
+ "step": 1400
207
+ },
208
+ {
209
+ "epoch": 0.4721589058938456,
210
+ "grad_norm": 3.353412628173828,
211
+ "learning_rate": 4.213611201563009e-05,
212
+ "loss": 0.9734893035888672,
213
+ "step": 1450
214
+ },
215
+ {
216
+ "epoch": 0.48844024747639203,
217
+ "grad_norm": 2.1188318729400635,
218
+ "learning_rate": 4.186475632258765e-05,
219
+ "loss": 0.9237932586669921,
220
+ "step": 1500
221
+ },
222
+ {
223
+ "epoch": 0.5047215890589385,
224
+ "grad_norm": 2.6821577548980713,
225
+ "learning_rate": 4.159340062954521e-05,
226
+ "loss": 0.8897212982177735,
227
+ "step": 1550
228
+ },
229
+ {
230
+ "epoch": 0.5210029306414848,
231
+ "grad_norm": 2.135638475418091,
232
+ "learning_rate": 4.132204493650277e-05,
233
+ "loss": 0.9515829467773438,
234
+ "step": 1600
235
+ },
236
+ {
237
+ "epoch": 0.5372842722240313,
238
+ "grad_norm": 2.822666645050049,
239
+ "learning_rate": 4.105068924346033e-05,
240
+ "loss": 0.9121678161621094,
241
+ "step": 1650
242
+ },
243
+ {
244
+ "epoch": 0.5535656138065776,
245
+ "grad_norm": 2.7274110317230225,
246
+ "learning_rate": 4.0779333550417894e-05,
247
+ "loss": 0.9216725158691407,
248
+ "step": 1700
249
+ },
250
+ {
251
+ "epoch": 0.5698469553891241,
252
+ "grad_norm": 2.2153918743133545,
253
+ "learning_rate": 4.050797785737545e-05,
254
+ "loss": 0.9212928009033203,
255
+ "step": 1750
256
+ },
257
+ {
258
+ "epoch": 0.5861282969716705,
259
+ "grad_norm": 2.8363842964172363,
260
+ "learning_rate": 4.023662216433301e-05,
261
+ "loss": 0.8820828247070313,
262
+ "step": 1800
263
+ },
264
+ {
265
+ "epoch": 0.6024096385542169,
266
+ "grad_norm": 3.7503888607025146,
267
+ "learning_rate": 3.996526647129057e-05,
268
+ "loss": 0.8915911865234375,
269
+ "step": 1850
270
+ },
271
+ {
272
+ "epoch": 0.6186909801367633,
273
+ "grad_norm": 2.9024317264556885,
274
+ "learning_rate": 3.969391077824813e-05,
275
+ "loss": 0.8826235961914063,
276
+ "step": 1900
277
+ },
278
+ {
279
+ "epoch": 0.6349723217193096,
280
+ "grad_norm": 2.6529974937438965,
281
+ "learning_rate": 3.942255508520569e-05,
282
+ "loss": 0.7980400085449219,
283
+ "step": 1950
284
+ },
285
+ {
286
+ "epoch": 0.6512536633018561,
287
+ "grad_norm": 2.9299404621124268,
288
+ "learning_rate": 3.9151199392163254e-05,
289
+ "loss": 0.8449476623535156,
290
+ "step": 2000
291
+ },
292
+ {
293
+ "epoch": 0.6675350048844024,
294
+ "grad_norm": 2.36393141746521,
295
+ "learning_rate": 3.887984369912081e-05,
296
+ "loss": 0.8074803161621094,
297
+ "step": 2050
298
+ },
299
+ {
300
+ "epoch": 0.6838163464669489,
301
+ "grad_norm": 3.3569858074188232,
302
+ "learning_rate": 3.860848800607837e-05,
303
+ "loss": 0.7903826141357422,
304
+ "step": 2100
305
+ },
306
+ {
307
+ "epoch": 0.7000976880494952,
308
+ "grad_norm": 2.7112410068511963,
309
+ "learning_rate": 3.833713231303593e-05,
310
+ "loss": 0.7987868499755859,
311
+ "step": 2150
312
+ },
313
+ {
314
+ "epoch": 0.7163790296320417,
315
+ "grad_norm": 2.964090347290039,
316
+ "learning_rate": 3.806577661999349e-05,
317
+ "loss": 0.9639425659179688,
318
+ "step": 2200
319
+ },
320
+ {
321
+ "epoch": 0.732660371214588,
322
+ "grad_norm": 2.48537015914917,
323
+ "learning_rate": 3.7794420926951055e-05,
324
+ "loss": 0.8240141296386718,
325
+ "step": 2250
326
+ },
327
+ {
328
+ "epoch": 0.7489417127971345,
329
+ "grad_norm": 3.37619948387146,
330
+ "learning_rate": 3.7523065233908613e-05,
331
+ "loss": 0.7668092346191406,
332
+ "step": 2300
333
+ },
334
+ {
335
+ "epoch": 0.7652230543796809,
336
+ "grad_norm": 3.8201708793640137,
337
+ "learning_rate": 3.725170954086617e-05,
338
+ "loss": 0.8363259887695312,
339
+ "step": 2350
340
+ },
341
+ {
342
+ "epoch": 0.7815043959622273,
343
+ "grad_norm": 2.115691900253296,
344
+ "learning_rate": 3.698035384782373e-05,
345
+ "loss": 0.6972411346435546,
346
+ "step": 2400
347
+ },
348
+ {
349
+ "epoch": 0.7977857375447737,
350
+ "grad_norm": 3.023482322692871,
351
+ "learning_rate": 3.670899815478129e-05,
352
+ "loss": 0.7648641967773437,
353
+ "step": 2450
354
+ },
355
+ {
356
+ "epoch": 0.8140670791273201,
357
+ "grad_norm": 2.759094715118408,
358
+ "learning_rate": 3.643764246173885e-05,
359
+ "loss": 0.7846918487548828,
360
+ "step": 2500
361
+ },
362
+ {
363
+ "epoch": 0.8303484207098665,
364
+ "grad_norm": 2.3906078338623047,
365
+ "learning_rate": 3.6166286768696414e-05,
366
+ "loss": 0.7888090515136719,
367
+ "step": 2550
368
+ },
369
+ {
370
+ "epoch": 0.8466297622924129,
371
+ "grad_norm": 2.275580644607544,
372
+ "learning_rate": 3.589493107565397e-05,
373
+ "loss": 0.751231689453125,
374
+ "step": 2600
375
+ },
376
+ {
377
+ "epoch": 0.8629111038749593,
378
+ "grad_norm": 2.802598237991333,
379
+ "learning_rate": 3.562357538261153e-05,
380
+ "loss": 0.6764369201660156,
381
+ "step": 2650
382
+ },
383
+ {
384
+ "epoch": 0.8791924454575057,
385
+ "grad_norm": 3.350801706314087,
386
+ "learning_rate": 3.535221968956909e-05,
387
+ "loss": 0.7479486083984375,
388
+ "step": 2700
389
+ },
390
+ {
391
+ "epoch": 0.8954737870400521,
392
+ "grad_norm": 2.61865496635437,
393
+ "learning_rate": 3.508086399652665e-05,
394
+ "loss": 0.7227684020996094,
395
+ "step": 2750
396
+ },
397
+ {
398
+ "epoch": 0.9117551286225986,
399
+ "grad_norm": 2.1037511825561523,
400
+ "learning_rate": 3.480950830348421e-05,
401
+ "loss": 0.738468017578125,
402
+ "step": 2800
403
+ },
404
+ {
405
+ "epoch": 0.9280364702051449,
406
+ "grad_norm": 3.354844093322754,
407
+ "learning_rate": 3.4538152610441774e-05,
408
+ "loss": 0.7212671661376953,
409
+ "step": 2850
410
+ },
411
+ {
412
+ "epoch": 0.9443178117876913,
413
+ "grad_norm": 3.2951793670654297,
414
+ "learning_rate": 3.426679691739933e-05,
415
+ "loss": 0.7343311309814453,
416
+ "step": 2900
417
+ },
418
+ {
419
+ "epoch": 0.9605991533702377,
420
+ "grad_norm": 2.4111647605895996,
421
+ "learning_rate": 3.399544122435689e-05,
422
+ "loss": 0.7199324798583985,
423
+ "step": 2950
424
+ },
425
+ {
426
+ "epoch": 0.9768804949527841,
427
+ "grad_norm": 3.4211530685424805,
428
+ "learning_rate": 3.372408553131445e-05,
429
+ "loss": 0.6700502014160157,
430
+ "step": 3000
431
+ },
432
+ {
433
+ "epoch": 0.9931618365353305,
434
+ "grad_norm": 3.150545120239258,
435
+ "learning_rate": 3.345272983827201e-05,
436
+ "loss": 0.7762191009521484,
437
+ "step": 3050
438
+ },
439
+ {
440
+ "epoch": 1.0,
441
+ "eval_bertscore_f1": 0.967131909063726,
442
+ "eval_bleu": 0.6360648795879948,
443
+ "eval_loss": 0.4895643889904022,
444
+ "eval_meteor": 0.7343290842184582,
445
+ "eval_rouge1": 0.8540844780031187,
446
+ "eval_rouge2": 0.7479710009166031,
447
+ "eval_runtime": 123.0031,
448
+ "eval_samples_per_second": 10.504,
449
+ "eval_steps_per_second": 1.317,
450
+ "step": 3071
451
+ },
452
+ {
453
+ "epoch": 1.009443178117877,
454
+ "grad_norm": 3.3871090412139893,
455
+ "learning_rate": 3.318137414522957e-05,
456
+ "loss": 0.6021672821044922,
457
+ "step": 3100
458
+ },
459
+ {
460
+ "epoch": 1.0257245197004232,
461
+ "grad_norm": 3.6125218868255615,
462
+ "learning_rate": 3.291001845218713e-05,
463
+ "loss": 0.5918669891357422,
464
+ "step": 3150
465
+ },
466
+ {
467
+ "epoch": 1.0420058612829697,
468
+ "grad_norm": 3.303037166595459,
469
+ "learning_rate": 3.263866275914469e-05,
470
+ "loss": 0.6978528594970703,
471
+ "step": 3200
472
+ },
473
+ {
474
+ "epoch": 1.0582872028655161,
475
+ "grad_norm": 4.224201202392578,
476
+ "learning_rate": 3.236730706610225e-05,
477
+ "loss": 0.6617731475830078,
478
+ "step": 3250
479
+ },
480
+ {
481
+ "epoch": 1.0745685444480626,
482
+ "grad_norm": 3.4028713703155518,
483
+ "learning_rate": 3.209595137305981e-05,
484
+ "loss": 0.6562766265869141,
485
+ "step": 3300
486
+ },
487
+ {
488
+ "epoch": 1.0908498860306088,
489
+ "grad_norm": 3.408994436264038,
490
+ "learning_rate": 3.182459568001737e-05,
491
+ "loss": 0.6277020263671875,
492
+ "step": 3350
493
+ },
494
+ {
495
+ "epoch": 1.1071312276131553,
496
+ "grad_norm": 2.8505773544311523,
497
+ "learning_rate": 3.155323998697493e-05,
498
+ "loss": 0.6104128646850586,
499
+ "step": 3400
500
+ },
501
+ {
502
+ "epoch": 1.1234125691957018,
503
+ "grad_norm": 3.966662645339966,
504
+ "learning_rate": 3.128188429393249e-05,
505
+ "loss": 0.6578683471679687,
506
+ "step": 3450
507
+ },
508
+ {
509
+ "epoch": 1.1396939107782482,
510
+ "grad_norm": 3.1553022861480713,
511
+ "learning_rate": 3.1010528600890045e-05,
512
+ "loss": 0.6029189300537109,
513
+ "step": 3500
514
+ },
515
+ {
516
+ "epoch": 1.1559752523607945,
517
+ "grad_norm": 2.4723594188690186,
518
+ "learning_rate": 3.0739172907847604e-05,
519
+ "loss": 0.5845599365234375,
520
+ "step": 3550
521
+ },
522
+ {
523
+ "epoch": 1.172256593943341,
524
+ "grad_norm": 3.4956090450286865,
525
+ "learning_rate": 3.0467817214805167e-05,
526
+ "loss": 0.7056507110595703,
527
+ "step": 3600
528
+ },
529
+ {
530
+ "epoch": 1.1885379355258874,
531
+ "grad_norm": 2.530539035797119,
532
+ "learning_rate": 3.0196461521762725e-05,
533
+ "loss": 0.6525007629394531,
534
+ "step": 3650
535
+ },
536
+ {
537
+ "epoch": 1.2048192771084336,
538
+ "grad_norm": 3.184187173843384,
539
+ "learning_rate": 2.992510582872029e-05,
540
+ "loss": 0.6267402267456055,
541
+ "step": 3700
542
+ },
543
+ {
544
+ "epoch": 1.22110061869098,
545
+ "grad_norm": 2.8025341033935547,
546
+ "learning_rate": 2.965375013567785e-05,
547
+ "loss": 0.6082941436767578,
548
+ "step": 3750
549
+ },
550
+ {
551
+ "epoch": 1.2373819602735265,
552
+ "grad_norm": 3.8412115573883057,
553
+ "learning_rate": 2.938239444263541e-05,
554
+ "loss": 0.6256865310668945,
555
+ "step": 3800
556
+ },
557
+ {
558
+ "epoch": 1.253663301856073,
559
+ "grad_norm": 2.749920606613159,
560
+ "learning_rate": 2.9111038749592967e-05,
561
+ "loss": 0.5645497512817382,
562
+ "step": 3850
563
+ },
564
+ {
565
+ "epoch": 1.2699446434386195,
566
+ "grad_norm": 3.3938541412353516,
567
+ "learning_rate": 2.8839683056550526e-05,
568
+ "loss": 0.6264593887329102,
569
+ "step": 3900
570
+ },
571
+ {
572
+ "epoch": 1.2862259850211657,
573
+ "grad_norm": 3.3540456295013428,
574
+ "learning_rate": 2.8568327363508085e-05,
575
+ "loss": 0.6137894821166993,
576
+ "step": 3950
577
+ },
578
+ {
579
+ "epoch": 1.3025073266037122,
580
+ "grad_norm": 2.7908146381378174,
581
+ "learning_rate": 2.829697167046565e-05,
582
+ "loss": 0.6254143142700195,
583
+ "step": 4000
584
+ },
585
+ {
586
+ "epoch": 1.3187886681862586,
587
+ "grad_norm": 2.430589199066162,
588
+ "learning_rate": 2.802561597742321e-05,
589
+ "loss": 0.6473207092285156,
590
+ "step": 4050
591
+ },
592
+ {
593
+ "epoch": 1.3350700097688049,
594
+ "grad_norm": 3.0248193740844727,
595
+ "learning_rate": 2.775426028438077e-05,
596
+ "loss": 0.6663880920410157,
597
+ "step": 4100
598
+ },
599
+ {
600
+ "epoch": 1.3513513513513513,
601
+ "grad_norm": 2.987276077270508,
602
+ "learning_rate": 2.7482904591338327e-05,
603
+ "loss": 0.5809850692749023,
604
+ "step": 4150
605
+ },
606
+ {
607
+ "epoch": 1.3676326929338978,
608
+ "grad_norm": 4.544067859649658,
609
+ "learning_rate": 2.7211548898295886e-05,
610
+ "loss": 0.5767688369750976,
611
+ "step": 4200
612
+ },
613
+ {
614
+ "epoch": 1.3839140345164442,
615
+ "grad_norm": 2.878161907196045,
616
+ "learning_rate": 2.694019320525345e-05,
617
+ "loss": 0.5451320266723633,
618
+ "step": 4250
619
+ },
620
+ {
621
+ "epoch": 1.4001953760989905,
622
+ "grad_norm": 3.9910073280334473,
623
+ "learning_rate": 2.666883751221101e-05,
624
+ "loss": 0.6352932739257813,
625
+ "step": 4300
626
+ },
627
+ {
628
+ "epoch": 1.416476717681537,
629
+ "grad_norm": 2.224102258682251,
630
+ "learning_rate": 2.639748181916857e-05,
631
+ "loss": 0.5719359588623046,
632
+ "step": 4350
633
+ },
634
+ {
635
+ "epoch": 1.4327580592640834,
636
+ "grad_norm": 2.5918033123016357,
637
+ "learning_rate": 2.6126126126126128e-05,
638
+ "loss": 0.5936804962158203,
639
+ "step": 4400
640
+ },
641
+ {
642
+ "epoch": 1.4490394008466296,
643
+ "grad_norm": 3.0837864875793457,
644
+ "learning_rate": 2.5854770433083687e-05,
645
+ "loss": 0.6499692535400391,
646
+ "step": 4450
647
+ },
648
+ {
649
+ "epoch": 1.465320742429176,
650
+ "grad_norm": 4.25653600692749,
651
+ "learning_rate": 2.5583414740041246e-05,
652
+ "loss": 0.5930651092529297,
653
+ "step": 4500
654
+ },
655
+ {
656
+ "epoch": 1.4816020840117226,
657
+ "grad_norm": 2.713430881500244,
658
+ "learning_rate": 2.5312059046998808e-05,
659
+ "loss": 0.5880680847167968,
660
+ "step": 4550
661
+ },
662
+ {
663
+ "epoch": 1.497883425594269,
664
+ "grad_norm": 2.596726417541504,
665
+ "learning_rate": 2.504070335395637e-05,
666
+ "loss": 0.609322280883789,
667
+ "step": 4600
668
+ },
669
+ {
670
+ "epoch": 1.5141647671768155,
671
+ "grad_norm": 5.058499813079834,
672
+ "learning_rate": 2.476934766091393e-05,
673
+ "loss": 0.5476129531860352,
674
+ "step": 4650
675
+ },
676
+ {
677
+ "epoch": 1.530446108759362,
678
+ "grad_norm": 2.4355289936065674,
679
+ "learning_rate": 2.4497991967871488e-05,
680
+ "loss": 0.6133829498291016,
681
+ "step": 4700
682
+ },
683
+ {
684
+ "epoch": 1.5467274503419082,
685
+ "grad_norm": 2.517214298248291,
686
+ "learning_rate": 2.4226636274829047e-05,
687
+ "loss": 0.6106953048706054,
688
+ "step": 4750
689
+ },
690
+ {
691
+ "epoch": 1.5630087919244544,
692
+ "grad_norm": 2.7961008548736572,
693
+ "learning_rate": 2.395528058178661e-05,
694
+ "loss": 0.6070757675170898,
695
+ "step": 4800
696
+ },
697
+ {
698
+ "epoch": 1.5792901335070009,
699
+ "grad_norm": 3.7750861644744873,
700
+ "learning_rate": 2.3683924888744168e-05,
701
+ "loss": 0.611992530822754,
702
+ "step": 4850
703
+ },
704
+ {
705
+ "epoch": 1.5955714750895473,
706
+ "grad_norm": 3.580327033996582,
707
+ "learning_rate": 2.3412569195701726e-05,
708
+ "loss": 0.5429486083984375,
709
+ "step": 4900
710
+ },
711
+ {
712
+ "epoch": 1.6118528166720938,
713
+ "grad_norm": 4.666822910308838,
714
+ "learning_rate": 2.3141213502659285e-05,
715
+ "loss": 0.49008914947509763,
716
+ "step": 4950
717
+ },
718
+ {
719
+ "epoch": 1.6281341582546403,
720
+ "grad_norm": 3.0332093238830566,
721
+ "learning_rate": 2.2869857809616847e-05,
722
+ "loss": 0.49931236267089846,
723
+ "step": 5000
724
+ },
725
+ {
726
+ "epoch": 1.6444154998371867,
727
+ "grad_norm": 2.752690076828003,
728
+ "learning_rate": 2.2598502116574406e-05,
729
+ "loss": 0.5916973876953125,
730
+ "step": 5050
731
+ },
732
+ {
733
+ "epoch": 1.660696841419733,
734
+ "grad_norm": 3.5713531970977783,
735
+ "learning_rate": 2.2327146423531965e-05,
736
+ "loss": 0.5342200469970703,
737
+ "step": 5100
738
+ },
739
+ {
740
+ "epoch": 1.6769781830022794,
741
+ "grad_norm": 2.947326898574829,
742
+ "learning_rate": 2.2055790730489524e-05,
743
+ "loss": 0.48489521026611326,
744
+ "step": 5150
745
+ },
746
+ {
747
+ "epoch": 1.6932595245848256,
748
+ "grad_norm": 3.4723641872406006,
749
+ "learning_rate": 2.1784435037447086e-05,
750
+ "loss": 0.5273918533325195,
751
+ "step": 5200
752
+ },
753
+ {
754
+ "epoch": 1.709540866167372,
755
+ "grad_norm": 3.2168502807617188,
756
+ "learning_rate": 2.1513079344404645e-05,
757
+ "loss": 0.576658935546875,
758
+ "step": 5250
759
+ },
760
+ {
761
+ "epoch": 1.7258222077499186,
762
+ "grad_norm": 3.858649492263794,
763
+ "learning_rate": 2.1241723651362204e-05,
764
+ "loss": 0.5316023254394531,
765
+ "step": 5300
766
+ },
767
+ {
768
+ "epoch": 1.742103549332465,
769
+ "grad_norm": 2.8334648609161377,
770
+ "learning_rate": 2.0970367958319766e-05,
771
+ "loss": 0.5504447555541992,
772
+ "step": 5350
773
+ },
774
+ {
775
+ "epoch": 1.7583848909150115,
776
+ "grad_norm": 4.290432453155518,
777
+ "learning_rate": 2.0699012265277325e-05,
778
+ "loss": 0.47645130157470705,
779
+ "step": 5400
780
+ },
781
+ {
782
+ "epoch": 1.774666232497558,
783
+ "grad_norm": 3.450201988220215,
784
+ "learning_rate": 2.0427656572234887e-05,
785
+ "loss": 0.49983680725097657,
786
+ "step": 5450
787
+ },
788
+ {
789
+ "epoch": 1.7909475740801042,
790
+ "grad_norm": 3.0057594776153564,
791
+ "learning_rate": 2.0156300879192446e-05,
792
+ "loss": 0.5014204025268555,
793
+ "step": 5500
794
+ },
795
+ {
796
+ "epoch": 1.8072289156626506,
797
+ "grad_norm": 2.4749011993408203,
798
+ "learning_rate": 1.9884945186150005e-05,
799
+ "loss": 0.5224055862426757,
800
+ "step": 5550
801
+ },
802
+ {
803
+ "epoch": 1.8235102572451969,
804
+ "grad_norm": 3.564490556716919,
805
+ "learning_rate": 1.9613589493107567e-05,
806
+ "loss": 0.4841350555419922,
807
+ "step": 5600
808
+ },
809
+ {
810
+ "epoch": 1.8397915988277433,
811
+ "grad_norm": 4.468665599822998,
812
+ "learning_rate": 1.9342233800065126e-05,
813
+ "loss": 0.49803077697753906,
814
+ "step": 5650
815
+ },
816
+ {
817
+ "epoch": 1.8560729404102898,
818
+ "grad_norm": 2.853323221206665,
819
+ "learning_rate": 1.9070878107022685e-05,
820
+ "loss": 0.5557261276245117,
821
+ "step": 5700
822
+ },
823
+ {
824
+ "epoch": 1.8723542819928363,
825
+ "grad_norm": 2.240102767944336,
826
+ "learning_rate": 1.8799522413980247e-05,
827
+ "loss": 0.5035658645629882,
828
+ "step": 5750
829
+ },
830
+ {
831
+ "epoch": 1.8886356235753827,
832
+ "grad_norm": 4.524099349975586,
833
+ "learning_rate": 1.8528166720937806e-05,
834
+ "loss": 0.4709853363037109,
835
+ "step": 5800
836
+ },
837
+ {
838
+ "epoch": 1.904916965157929,
839
+ "grad_norm": 3.5889639854431152,
840
+ "learning_rate": 1.8256811027895364e-05,
841
+ "loss": 0.5654364395141601,
842
+ "step": 5850
843
+ },
844
+ {
845
+ "epoch": 1.9211983067404754,
846
+ "grad_norm": 4.631803512573242,
847
+ "learning_rate": 1.7985455334852927e-05,
848
+ "loss": 0.4828892517089844,
849
+ "step": 5900
850
+ },
851
+ {
852
+ "epoch": 1.9374796483230217,
853
+ "grad_norm": 3.324930191040039,
854
+ "learning_rate": 1.7714099641810485e-05,
855
+ "loss": 0.5719730377197265,
856
+ "step": 5950
857
+ },
858
+ {
859
+ "epoch": 1.9537609899055681,
860
+ "grad_norm": 4.518911838531494,
861
+ "learning_rate": 1.7442743948768044e-05,
862
+ "loss": 0.4871857833862305,
863
+ "step": 6000
864
+ },
865
+ {
866
+ "epoch": 1.9700423314881146,
867
+ "grad_norm": 4.349981307983398,
868
+ "learning_rate": 1.7171388255725606e-05,
869
+ "loss": 0.5515385437011718,
870
+ "step": 6050
871
+ },
872
+ {
873
+ "epoch": 1.986323673070661,
874
+ "grad_norm": 3.0791079998016357,
875
+ "learning_rate": 1.6900032562683165e-05,
876
+ "loss": 0.5213652801513672,
877
+ "step": 6100
878
+ },
879
+ {
880
+ "epoch": 2.0,
881
+ "eval_bertscore_f1": 0.9760125298802698,
882
+ "eval_bleu": 0.7369094701809736,
883
+ "eval_loss": 0.36441001296043396,
884
+ "eval_meteor": 0.8127092299374118,
885
+ "eval_rouge1": 0.8875418149898048,
886
+ "eval_rouge2": 0.8077254196229909,
887
+ "eval_runtime": 132.4191,
888
+ "eval_samples_per_second": 9.757,
889
+ "eval_steps_per_second": 1.223,
890
+ "step": 6142
891
+ },
892
+ {
893
+ "epoch": 2.0026050146532075,
894
+ "grad_norm": 1.9988925457000732,
895
+ "learning_rate": 1.6628676869640724e-05,
896
+ "loss": 0.4895309066772461,
897
+ "step": 6150
898
+ },
899
+ {
900
+ "epoch": 2.018886356235754,
901
+ "grad_norm": 3.848978042602539,
902
+ "learning_rate": 1.6357321176598286e-05,
903
+ "loss": 0.5836200714111328,
904
+ "step": 6200
905
+ },
906
+ {
907
+ "epoch": 2.0351676978183004,
908
+ "grad_norm": 3.77553129196167,
909
+ "learning_rate": 1.6085965483555845e-05,
910
+ "loss": 0.5029875564575196,
911
+ "step": 6250
912
+ },
913
+ {
914
+ "epoch": 2.0514490394008464,
915
+ "grad_norm": 3.317784070968628,
916
+ "learning_rate": 1.5814609790513404e-05,
917
+ "loss": 0.4987943649291992,
918
+ "step": 6300
919
+ },
920
+ {
921
+ "epoch": 2.067730380983393,
922
+ "grad_norm": 6.215928554534912,
923
+ "learning_rate": 1.5543254097470966e-05,
924
+ "loss": 0.4729055404663086,
925
+ "step": 6350
926
+ },
927
+ {
928
+ "epoch": 2.0840117225659394,
929
+ "grad_norm": 4.411025524139404,
930
+ "learning_rate": 1.5271898404428525e-05,
931
+ "loss": 0.47504291534423826,
932
+ "step": 6400
933
+ },
934
+ {
935
+ "epoch": 2.100293064148486,
936
+ "grad_norm": 3.878382444381714,
937
+ "learning_rate": 1.5000542711386087e-05,
938
+ "loss": 0.5043264389038086,
939
+ "step": 6450
940
+ },
941
+ {
942
+ "epoch": 2.1165744057310323,
943
+ "grad_norm": 3.332885980606079,
944
+ "learning_rate": 1.4729187018343646e-05,
945
+ "loss": 0.5287798309326172,
946
+ "step": 6500
947
+ },
948
+ {
949
+ "epoch": 2.1328557473135787,
950
+ "grad_norm": 5.045743942260742,
951
+ "learning_rate": 1.4457831325301205e-05,
952
+ "loss": 0.5503104782104492,
953
+ "step": 6550
954
+ },
955
+ {
956
+ "epoch": 2.149137088896125,
957
+ "grad_norm": 4.425091743469238,
958
+ "learning_rate": 1.4186475632258767e-05,
959
+ "loss": 0.5537314224243164,
960
+ "step": 6600
961
+ },
962
+ {
963
+ "epoch": 2.165418430478671,
964
+ "grad_norm": 4.250468730926514,
965
+ "learning_rate": 1.3915119939216326e-05,
966
+ "loss": 0.4960391235351562,
967
+ "step": 6650
968
+ },
969
+ {
970
+ "epoch": 2.1816997720612177,
971
+ "grad_norm": 2.38873028755188,
972
+ "learning_rate": 1.3643764246173885e-05,
973
+ "loss": 0.4847539520263672,
974
+ "step": 6700
975
+ },
976
+ {
977
+ "epoch": 2.197981113643764,
978
+ "grad_norm": 3.1205639839172363,
979
+ "learning_rate": 1.3372408553131447e-05,
980
+ "loss": 0.530453872680664,
981
+ "step": 6750
982
+ },
983
+ {
984
+ "epoch": 2.2142624552263106,
985
+ "grad_norm": 3.130052089691162,
986
+ "learning_rate": 1.3101052860089006e-05,
987
+ "loss": 0.4768033981323242,
988
+ "step": 6800
989
+ },
990
+ {
991
+ "epoch": 2.230543796808857,
992
+ "grad_norm": 2.549163341522217,
993
+ "learning_rate": 1.2829697167046565e-05,
994
+ "loss": 0.5177365493774414,
995
+ "step": 6850
996
+ },
997
+ {
998
+ "epoch": 2.2468251383914035,
999
+ "grad_norm": 3.2036118507385254,
1000
+ "learning_rate": 1.2558341474004127e-05,
1001
+ "loss": 0.48484851837158205,
1002
+ "step": 6900
1003
+ },
1004
+ {
1005
+ "epoch": 2.26310647997395,
1006
+ "grad_norm": 3.249213695526123,
1007
+ "learning_rate": 1.2286985780961686e-05,
1008
+ "loss": 0.5264522933959961,
1009
+ "step": 6950
1010
+ },
1011
+ {
1012
+ "epoch": 2.2793878215564964,
1013
+ "grad_norm": 3.0506670475006104,
1014
+ "learning_rate": 1.2015630087919246e-05,
1015
+ "loss": 0.5557387161254883,
1016
+ "step": 7000
1017
+ },
1018
+ {
1019
+ "epoch": 2.295669163139043,
1020
+ "grad_norm": 4.090348243713379,
1021
+ "learning_rate": 1.1744274394876805e-05,
1022
+ "loss": 0.44691120147705077,
1023
+ "step": 7050
1024
+ },
1025
+ {
1026
+ "epoch": 2.311950504721589,
1027
+ "grad_norm": 4.048130512237549,
1028
+ "learning_rate": 1.1472918701834365e-05,
1029
+ "loss": 0.47702239990234374,
1030
+ "step": 7100
1031
+ },
1032
+ {
1033
+ "epoch": 2.3282318463041354,
1034
+ "grad_norm": 4.8760528564453125,
1035
+ "learning_rate": 1.1201563008791926e-05,
1036
+ "loss": 0.5293217468261718,
1037
+ "step": 7150
1038
+ },
1039
+ {
1040
+ "epoch": 2.344513187886682,
1041
+ "grad_norm": 1.611255407333374,
1042
+ "learning_rate": 1.0930207315749485e-05,
1043
+ "loss": 0.5165376281738281,
1044
+ "step": 7200
1045
+ },
1046
+ {
1047
+ "epoch": 2.3607945294692283,
1048
+ "grad_norm": 3.9336297512054443,
1049
+ "learning_rate": 1.0658851622707045e-05,
1050
+ "loss": 0.5475522232055664,
1051
+ "step": 7250
1052
+ },
1053
+ {
1054
+ "epoch": 2.3770758710517748,
1055
+ "grad_norm": 3.2688589096069336,
1056
+ "learning_rate": 1.0387495929664604e-05,
1057
+ "loss": 0.4639253616333008,
1058
+ "step": 7300
1059
+ },
1060
+ {
1061
+ "epoch": 2.393357212634321,
1062
+ "grad_norm": 2.2077689170837402,
1063
+ "learning_rate": 1.0116140236622165e-05,
1064
+ "loss": 0.49176544189453125,
1065
+ "step": 7350
1066
+ },
1067
+ {
1068
+ "epoch": 2.4096385542168672,
1069
+ "grad_norm": 3.6767163276672363,
1070
+ "learning_rate": 9.844784543579723e-06,
1071
+ "loss": 0.46481277465820314,
1072
+ "step": 7400
1073
+ },
1074
+ {
1075
+ "epoch": 2.4259198957994137,
1076
+ "grad_norm": 2.3092267513275146,
1077
+ "learning_rate": 9.573428850537284e-06,
1078
+ "loss": 0.4961623382568359,
1079
+ "step": 7450
1080
+ },
1081
+ {
1082
+ "epoch": 2.44220123738196,
1083
+ "grad_norm": 2.597843885421753,
1084
+ "learning_rate": 9.302073157494844e-06,
1085
+ "loss": 0.48158348083496094,
1086
+ "step": 7500
1087
+ },
1088
+ {
1089
+ "epoch": 2.4584825789645066,
1090
+ "grad_norm": 3.8426899909973145,
1091
+ "learning_rate": 9.030717464452403e-06,
1092
+ "loss": 0.5378573989868164,
1093
+ "step": 7550
1094
+ },
1095
+ {
1096
+ "epoch": 2.474763920547053,
1097
+ "grad_norm": 3.84844970703125,
1098
+ "learning_rate": 8.759361771409964e-06,
1099
+ "loss": 0.44852672576904296,
1100
+ "step": 7600
1101
+ },
1102
+ {
1103
+ "epoch": 2.4910452621295995,
1104
+ "grad_norm": 1.7561177015304565,
1105
+ "learning_rate": 8.488006078367524e-06,
1106
+ "loss": 0.47510692596435544,
1107
+ "step": 7650
1108
+ },
1109
+ {
1110
+ "epoch": 2.507326603712146,
1111
+ "grad_norm": 3.857144355773926,
1112
+ "learning_rate": 8.216650385325085e-06,
1113
+ "loss": 0.40881168365478515,
1114
+ "step": 7700
1115
+ },
1116
+ {
1117
+ "epoch": 2.5236079452946925,
1118
+ "grad_norm": 3.1903669834136963,
1119
+ "learning_rate": 7.945294692282644e-06,
1120
+ "loss": 0.47881248474121096,
1121
+ "step": 7750
1122
+ },
1123
+ {
1124
+ "epoch": 2.539889286877239,
1125
+ "grad_norm": 5.834493637084961,
1126
+ "learning_rate": 7.673938999240204e-06,
1127
+ "loss": 0.4648504638671875,
1128
+ "step": 7800
1129
+ },
1130
+ {
1131
+ "epoch": 2.556170628459785,
1132
+ "grad_norm": 4.4403252601623535,
1133
+ "learning_rate": 7.402583306197765e-06,
1134
+ "loss": 0.45219791412353516,
1135
+ "step": 7850
1136
+ },
1137
+ {
1138
+ "epoch": 2.5724519700423314,
1139
+ "grad_norm": 3.979234457015991,
1140
+ "learning_rate": 7.1312276131553235e-06,
1141
+ "loss": 0.4795208358764648,
1142
+ "step": 7900
1143
+ },
1144
+ {
1145
+ "epoch": 2.588733311624878,
1146
+ "grad_norm": 7.058864593505859,
1147
+ "learning_rate": 6.859871920112884e-06,
1148
+ "loss": 0.47828922271728513,
1149
+ "step": 7950
1150
+ },
1151
+ {
1152
+ "epoch": 2.6050146532074243,
1153
+ "grad_norm": 2.258791923522949,
1154
+ "learning_rate": 6.5885162270704446e-06,
1155
+ "loss": 0.47586013793945314,
1156
+ "step": 8000
1157
+ },
1158
+ {
1159
+ "epoch": 2.6212959947899708,
1160
+ "grad_norm": 3.1901180744171143,
1161
+ "learning_rate": 6.317160534028005e-06,
1162
+ "loss": 0.42454421997070313,
1163
+ "step": 8050
1164
+ },
1165
+ {
1166
+ "epoch": 2.6375773363725172,
1167
+ "grad_norm": 5.115426540374756,
1168
+ "learning_rate": 6.045804840985564e-06,
1169
+ "loss": 0.478512077331543,
1170
+ "step": 8100
1171
+ },
1172
+ {
1173
+ "epoch": 2.6538586779550632,
1174
+ "grad_norm": 2.2929582595825195,
1175
+ "learning_rate": 5.774449147943124e-06,
1176
+ "loss": 0.5165943527221679,
1177
+ "step": 8150
1178
+ },
1179
+ {
1180
+ "epoch": 2.6701400195376097,
1181
+ "grad_norm": 4.737906455993652,
1182
+ "learning_rate": 5.503093454900684e-06,
1183
+ "loss": 0.5091237640380859,
1184
+ "step": 8200
1185
+ },
1186
+ {
1187
+ "epoch": 2.686421361120156,
1188
+ "grad_norm": 2.8958566188812256,
1189
+ "learning_rate": 5.231737761858245e-06,
1190
+ "loss": 0.5252229690551757,
1191
+ "step": 8250
1192
+ },
1193
+ {
1194
+ "epoch": 2.7027027027027026,
1195
+ "grad_norm": 3.7006046772003174,
1196
+ "learning_rate": 4.960382068815804e-06,
1197
+ "loss": 0.4727284240722656,
1198
+ "step": 8300
1199
+ },
1200
+ {
1201
+ "epoch": 2.718984044285249,
1202
+ "grad_norm": 4.118995189666748,
1203
+ "learning_rate": 4.689026375773364e-06,
1204
+ "loss": 0.5148253631591797,
1205
+ "step": 8350
1206
+ },
1207
+ {
1208
+ "epoch": 2.7352653858677956,
1209
+ "grad_norm": 2.285799980163574,
1210
+ "learning_rate": 4.417670682730924e-06,
1211
+ "loss": 0.47666587829589846,
1212
+ "step": 8400
1213
+ },
1214
+ {
1215
+ "epoch": 2.751546727450342,
1216
+ "grad_norm": 5.824726104736328,
1217
+ "learning_rate": 4.146314989688484e-06,
1218
+ "loss": 0.3846194839477539,
1219
+ "step": 8450
1220
+ },
1221
+ {
1222
+ "epoch": 2.7678280690328885,
1223
+ "grad_norm": 3.3558638095855713,
1224
+ "learning_rate": 3.874959296646044e-06,
1225
+ "loss": 0.47148590087890624,
1226
+ "step": 8500
1227
+ },
1228
+ {
1229
+ "epoch": 2.784109410615435,
1230
+ "grad_norm": 5.155383110046387,
1231
+ "learning_rate": 3.603603603603604e-06,
1232
+ "loss": 0.49628185272216796,
1233
+ "step": 8550
1234
+ },
1235
+ {
1236
+ "epoch": 2.800390752197981,
1237
+ "grad_norm": 2.7732632160186768,
1238
+ "learning_rate": 3.3322479105611635e-06,
1239
+ "loss": 0.4713264465332031,
1240
+ "step": 8600
1241
+ },
1242
+ {
1243
+ "epoch": 2.8166720937805274,
1244
+ "grad_norm": 4.7110066413879395,
1245
+ "learning_rate": 3.0608922175187236e-06,
1246
+ "loss": 0.46566177368164063,
1247
+ "step": 8650
1248
+ },
1249
+ {
1250
+ "epoch": 2.832953435363074,
1251
+ "grad_norm": 3.182767868041992,
1252
+ "learning_rate": 2.7895365244762837e-06,
1253
+ "loss": 0.4322200775146484,
1254
+ "step": 8700
1255
+ },
1256
+ {
1257
+ "epoch": 2.8492347769456203,
1258
+ "grad_norm": 2.3082404136657715,
1259
+ "learning_rate": 2.5181808314338434e-06,
1260
+ "loss": 0.45952880859375,
1261
+ "step": 8750
1262
+ },
1263
+ {
1264
+ "epoch": 2.865516118528167,
1265
+ "grad_norm": 3.0804383754730225,
1266
+ "learning_rate": 2.2468251383914035e-06,
1267
+ "loss": 0.5015320205688476,
1268
+ "step": 8800
1269
+ },
1270
+ {
1271
+ "epoch": 2.8817974601107132,
1272
+ "grad_norm": 2.3712687492370605,
1273
+ "learning_rate": 1.9754694453489636e-06,
1274
+ "loss": 0.46776729583740234,
1275
+ "step": 8850
1276
+ },
1277
+ {
1278
+ "epoch": 2.8980788016932593,
1279
+ "grad_norm": 3.109934091567993,
1280
+ "learning_rate": 1.7041137523065235e-06,
1281
+ "loss": 0.4564864349365234,
1282
+ "step": 8900
1283
+ },
1284
+ {
1285
+ "epoch": 2.9143601432758057,
1286
+ "grad_norm": 5.136889934539795,
1287
+ "learning_rate": 1.4327580592640834e-06,
1288
+ "loss": 0.4858356857299805,
1289
+ "step": 8950
1290
+ },
1291
+ {
1292
+ "epoch": 2.930641484858352,
1293
+ "grad_norm": 5.105923175811768,
1294
+ "learning_rate": 1.1614023662216434e-06,
1295
+ "loss": 0.44804500579833983,
1296
+ "step": 9000
1297
+ },
1298
+ {
1299
+ "epoch": 2.9469228264408986,
1300
+ "grad_norm": 2.8601877689361572,
1301
+ "learning_rate": 8.900466731792033e-07,
1302
+ "loss": 0.42105804443359374,
1303
+ "step": 9050
1304
+ },
1305
+ {
1306
+ "epoch": 2.963204168023445,
1307
+ "grad_norm": 2.99465012550354,
1308
+ "learning_rate": 6.186909801367633e-07,
1309
+ "loss": 0.39937313079833986,
1310
+ "step": 9100
1311
+ },
1312
+ {
1313
+ "epoch": 2.9794855096059916,
1314
+ "grad_norm": 1.473414421081543,
1315
+ "learning_rate": 3.4733528709432325e-07,
1316
+ "loss": 0.43089988708496096,
1317
+ "step": 9150
1318
+ },
1319
+ {
1320
+ "epoch": 2.995766851188538,
1321
+ "grad_norm": 3.2104876041412354,
1322
+ "learning_rate": 7.597959405188321e-08,
1323
+ "loss": 0.48259429931640624,
1324
+ "step": 9200
1325
+ },
1326
+ {
1327
+ "epoch": 3.0,
1328
+ "eval_bertscore_f1": 0.9784284891912443,
1329
+ "eval_bleu": 0.7639446756702927,
1330
+ "eval_loss": 0.33530932664871216,
1331
+ "eval_meteor": 0.8315404974609083,
1332
+ "eval_rouge1": 0.8979837043455776,
1333
+ "eval_rouge2": 0.8245087404389784,
1334
+ "eval_runtime": 131.767,
1335
+ "eval_samples_per_second": 9.805,
1336
+ "eval_steps_per_second": 1.229,
1337
+ "step": 9213
1338
+ }
1339
+ ],
1340
+ "logging_steps": 50,
1341
+ "max_steps": 9213,
1342
+ "num_input_tokens_seen": 0,
1343
+ "num_train_epochs": 3,
1344
+ "save_steps": 500,
1345
+ "stateful_callbacks": {
1346
+ "TrainerControl": {
1347
+ "args": {
1348
+ "should_epoch_stop": false,
1349
+ "should_evaluate": false,
1350
+ "should_log": false,
1351
+ "should_save": true,
1352
+ "should_training_stop": true
1353
+ },
1354
+ "attributes": {}
1355
+ }
1356
+ },
1357
+ "total_flos": 2.263887217557504e+16,
1358
+ "train_batch_size": 8,
1359
+ "trial_name": null,
1360
+ "trial_params": null
1361
+ }
checkpoint-9213/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21e7988a724f50ab4d65854a8bd4de7b4eceb713886a6a05ceeaeae7fb11b713
3
+ size 4920
tokenizer.json CHANGED
@@ -2,13 +2,13 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 128,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
- "Fixed": 128
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
@@ -61,906 +61,6 @@
61
  "rstrip": false,
62
  "normalized": true,
63
  "special": true
64
- },
65
- {
66
- "id": 32000,
67
- "content": "<extra_id_99>",
68
- "single_word": false,
69
- "lstrip": true,
70
- "rstrip": false,
71
- "normalized": true,
72
- "special": true
73
- },
74
- {
75
- "id": 32001,
76
- "content": "<extra_id_98>",
77
- "single_word": false,
78
- "lstrip": true,
79
- "rstrip": false,
80
- "normalized": true,
81
- "special": true
82
- },
83
- {
84
- "id": 32002,
85
- "content": "<extra_id_97>",
86
- "single_word": false,
87
- "lstrip": true,
88
- "rstrip": false,
89
- "normalized": true,
90
- "special": true
91
- },
92
- {
93
- "id": 32003,
94
- "content": "<extra_id_96>",
95
- "single_word": false,
96
- "lstrip": true,
97
- "rstrip": false,
98
- "normalized": true,
99
- "special": true
100
- },
101
- {
102
- "id": 32004,
103
- "content": "<extra_id_95>",
104
- "single_word": false,
105
- "lstrip": true,
106
- "rstrip": false,
107
- "normalized": true,
108
- "special": true
109
- },
110
- {
111
- "id": 32005,
112
- "content": "<extra_id_94>",
113
- "single_word": false,
114
- "lstrip": true,
115
- "rstrip": false,
116
- "normalized": true,
117
- "special": true
118
- },
119
- {
120
- "id": 32006,
121
- "content": "<extra_id_93>",
122
- "single_word": false,
123
- "lstrip": true,
124
- "rstrip": false,
125
- "normalized": true,
126
- "special": true
127
- },
128
- {
129
- "id": 32007,
130
- "content": "<extra_id_92>",
131
- "single_word": false,
132
- "lstrip": true,
133
- "rstrip": false,
134
- "normalized": true,
135
- "special": true
136
- },
137
- {
138
- "id": 32008,
139
- "content": "<extra_id_91>",
140
- "single_word": false,
141
- "lstrip": true,
142
- "rstrip": false,
143
- "normalized": true,
144
- "special": true
145
- },
146
- {
147
- "id": 32009,
148
- "content": "<extra_id_90>",
149
- "single_word": false,
150
- "lstrip": true,
151
- "rstrip": false,
152
- "normalized": true,
153
- "special": true
154
- },
155
- {
156
- "id": 32010,
157
- "content": "<extra_id_89>",
158
- "single_word": false,
159
- "lstrip": true,
160
- "rstrip": false,
161
- "normalized": true,
162
- "special": true
163
- },
164
- {
165
- "id": 32011,
166
- "content": "<extra_id_88>",
167
- "single_word": false,
168
- "lstrip": true,
169
- "rstrip": false,
170
- "normalized": true,
171
- "special": true
172
- },
173
- {
174
- "id": 32012,
175
- "content": "<extra_id_87>",
176
- "single_word": false,
177
- "lstrip": true,
178
- "rstrip": false,
179
- "normalized": true,
180
- "special": true
181
- },
182
- {
183
- "id": 32013,
184
- "content": "<extra_id_86>",
185
- "single_word": false,
186
- "lstrip": true,
187
- "rstrip": false,
188
- "normalized": true,
189
- "special": true
190
- },
191
- {
192
- "id": 32014,
193
- "content": "<extra_id_85>",
194
- "single_word": false,
195
- "lstrip": true,
196
- "rstrip": false,
197
- "normalized": true,
198
- "special": true
199
- },
200
- {
201
- "id": 32015,
202
- "content": "<extra_id_84>",
203
- "single_word": false,
204
- "lstrip": true,
205
- "rstrip": false,
206
- "normalized": true,
207
- "special": true
208
- },
209
- {
210
- "id": 32016,
211
- "content": "<extra_id_83>",
212
- "single_word": false,
213
- "lstrip": true,
214
- "rstrip": false,
215
- "normalized": true,
216
- "special": true
217
- },
218
- {
219
- "id": 32017,
220
- "content": "<extra_id_82>",
221
- "single_word": false,
222
- "lstrip": true,
223
- "rstrip": false,
224
- "normalized": true,
225
- "special": true
226
- },
227
- {
228
- "id": 32018,
229
- "content": "<extra_id_81>",
230
- "single_word": false,
231
- "lstrip": true,
232
- "rstrip": false,
233
- "normalized": true,
234
- "special": true
235
- },
236
- {
237
- "id": 32019,
238
- "content": "<extra_id_80>",
239
- "single_word": false,
240
- "lstrip": true,
241
- "rstrip": false,
242
- "normalized": true,
243
- "special": true
244
- },
245
- {
246
- "id": 32020,
247
- "content": "<extra_id_79>",
248
- "single_word": false,
249
- "lstrip": true,
250
- "rstrip": false,
251
- "normalized": true,
252
- "special": true
253
- },
254
- {
255
- "id": 32021,
256
- "content": "<extra_id_78>",
257
- "single_word": false,
258
- "lstrip": true,
259
- "rstrip": false,
260
- "normalized": true,
261
- "special": true
262
- },
263
- {
264
- "id": 32022,
265
- "content": "<extra_id_77>",
266
- "single_word": false,
267
- "lstrip": true,
268
- "rstrip": false,
269
- "normalized": true,
270
- "special": true
271
- },
272
- {
273
- "id": 32023,
274
- "content": "<extra_id_76>",
275
- "single_word": false,
276
- "lstrip": true,
277
- "rstrip": false,
278
- "normalized": true,
279
- "special": true
280
- },
281
- {
282
- "id": 32024,
283
- "content": "<extra_id_75>",
284
- "single_word": false,
285
- "lstrip": true,
286
- "rstrip": false,
287
- "normalized": true,
288
- "special": true
289
- },
290
- {
291
- "id": 32025,
292
- "content": "<extra_id_74>",
293
- "single_word": false,
294
- "lstrip": true,
295
- "rstrip": false,
296
- "normalized": true,
297
- "special": true
298
- },
299
- {
300
- "id": 32026,
301
- "content": "<extra_id_73>",
302
- "single_word": false,
303
- "lstrip": true,
304
- "rstrip": false,
305
- "normalized": true,
306
- "special": true
307
- },
308
- {
309
- "id": 32027,
310
- "content": "<extra_id_72>",
311
- "single_word": false,
312
- "lstrip": true,
313
- "rstrip": false,
314
- "normalized": true,
315
- "special": true
316
- },
317
- {
318
- "id": 32028,
319
- "content": "<extra_id_71>",
320
- "single_word": false,
321
- "lstrip": true,
322
- "rstrip": false,
323
- "normalized": true,
324
- "special": true
325
- },
326
- {
327
- "id": 32029,
328
- "content": "<extra_id_70>",
329
- "single_word": false,
330
- "lstrip": true,
331
- "rstrip": false,
332
- "normalized": true,
333
- "special": true
334
- },
335
- {
336
- "id": 32030,
337
- "content": "<extra_id_69>",
338
- "single_word": false,
339
- "lstrip": true,
340
- "rstrip": false,
341
- "normalized": true,
342
- "special": true
343
- },
344
- {
345
- "id": 32031,
346
- "content": "<extra_id_68>",
347
- "single_word": false,
348
- "lstrip": true,
349
- "rstrip": false,
350
- "normalized": true,
351
- "special": true
352
- },
353
- {
354
- "id": 32032,
355
- "content": "<extra_id_67>",
356
- "single_word": false,
357
- "lstrip": true,
358
- "rstrip": false,
359
- "normalized": true,
360
- "special": true
361
- },
362
- {
363
- "id": 32033,
364
- "content": "<extra_id_66>",
365
- "single_word": false,
366
- "lstrip": true,
367
- "rstrip": false,
368
- "normalized": true,
369
- "special": true
370
- },
371
- {
372
- "id": 32034,
373
- "content": "<extra_id_65>",
374
- "single_word": false,
375
- "lstrip": true,
376
- "rstrip": false,
377
- "normalized": true,
378
- "special": true
379
- },
380
- {
381
- "id": 32035,
382
- "content": "<extra_id_64>",
383
- "single_word": false,
384
- "lstrip": true,
385
- "rstrip": false,
386
- "normalized": true,
387
- "special": true
388
- },
389
- {
390
- "id": 32036,
391
- "content": "<extra_id_63>",
392
- "single_word": false,
393
- "lstrip": true,
394
- "rstrip": false,
395
- "normalized": true,
396
- "special": true
397
- },
398
- {
399
- "id": 32037,
400
- "content": "<extra_id_62>",
401
- "single_word": false,
402
- "lstrip": true,
403
- "rstrip": false,
404
- "normalized": true,
405
- "special": true
406
- },
407
- {
408
- "id": 32038,
409
- "content": "<extra_id_61>",
410
- "single_word": false,
411
- "lstrip": true,
412
- "rstrip": false,
413
- "normalized": true,
414
- "special": true
415
- },
416
- {
417
- "id": 32039,
418
- "content": "<extra_id_60>",
419
- "single_word": false,
420
- "lstrip": true,
421
- "rstrip": false,
422
- "normalized": true,
423
- "special": true
424
- },
425
- {
426
- "id": 32040,
427
- "content": "<extra_id_59>",
428
- "single_word": false,
429
- "lstrip": true,
430
- "rstrip": false,
431
- "normalized": true,
432
- "special": true
433
- },
434
- {
435
- "id": 32041,
436
- "content": "<extra_id_58>",
437
- "single_word": false,
438
- "lstrip": true,
439
- "rstrip": false,
440
- "normalized": true,
441
- "special": true
442
- },
443
- {
444
- "id": 32042,
445
- "content": "<extra_id_57>",
446
- "single_word": false,
447
- "lstrip": true,
448
- "rstrip": false,
449
- "normalized": true,
450
- "special": true
451
- },
452
- {
453
- "id": 32043,
454
- "content": "<extra_id_56>",
455
- "single_word": false,
456
- "lstrip": true,
457
- "rstrip": false,
458
- "normalized": true,
459
- "special": true
460
- },
461
- {
462
- "id": 32044,
463
- "content": "<extra_id_55>",
464
- "single_word": false,
465
- "lstrip": true,
466
- "rstrip": false,
467
- "normalized": true,
468
- "special": true
469
- },
470
- {
471
- "id": 32045,
472
- "content": "<extra_id_54>",
473
- "single_word": false,
474
- "lstrip": true,
475
- "rstrip": false,
476
- "normalized": true,
477
- "special": true
478
- },
479
- {
480
- "id": 32046,
481
- "content": "<extra_id_53>",
482
- "single_word": false,
483
- "lstrip": true,
484
- "rstrip": false,
485
- "normalized": true,
486
- "special": true
487
- },
488
- {
489
- "id": 32047,
490
- "content": "<extra_id_52>",
491
- "single_word": false,
492
- "lstrip": true,
493
- "rstrip": false,
494
- "normalized": true,
495
- "special": true
496
- },
497
- {
498
- "id": 32048,
499
- "content": "<extra_id_51>",
500
- "single_word": false,
501
- "lstrip": true,
502
- "rstrip": false,
503
- "normalized": true,
504
- "special": true
505
- },
506
- {
507
- "id": 32049,
508
- "content": "<extra_id_50>",
509
- "single_word": false,
510
- "lstrip": true,
511
- "rstrip": false,
512
- "normalized": true,
513
- "special": true
514
- },
515
- {
516
- "id": 32050,
517
- "content": "<extra_id_49>",
518
- "single_word": false,
519
- "lstrip": true,
520
- "rstrip": false,
521
- "normalized": true,
522
- "special": true
523
- },
524
- {
525
- "id": 32051,
526
- "content": "<extra_id_48>",
527
- "single_word": false,
528
- "lstrip": true,
529
- "rstrip": false,
530
- "normalized": true,
531
- "special": true
532
- },
533
- {
534
- "id": 32052,
535
- "content": "<extra_id_47>",
536
- "single_word": false,
537
- "lstrip": true,
538
- "rstrip": false,
539
- "normalized": true,
540
- "special": true
541
- },
542
- {
543
- "id": 32053,
544
- "content": "<extra_id_46>",
545
- "single_word": false,
546
- "lstrip": true,
547
- "rstrip": false,
548
- "normalized": true,
549
- "special": true
550
- },
551
- {
552
- "id": 32054,
553
- "content": "<extra_id_45>",
554
- "single_word": false,
555
- "lstrip": true,
556
- "rstrip": false,
557
- "normalized": true,
558
- "special": true
559
- },
560
- {
561
- "id": 32055,
562
- "content": "<extra_id_44>",
563
- "single_word": false,
564
- "lstrip": true,
565
- "rstrip": false,
566
- "normalized": true,
567
- "special": true
568
- },
569
- {
570
- "id": 32056,
571
- "content": "<extra_id_43>",
572
- "single_word": false,
573
- "lstrip": true,
574
- "rstrip": false,
575
- "normalized": true,
576
- "special": true
577
- },
578
- {
579
- "id": 32057,
580
- "content": "<extra_id_42>",
581
- "single_word": false,
582
- "lstrip": true,
583
- "rstrip": false,
584
- "normalized": true,
585
- "special": true
586
- },
587
- {
588
- "id": 32058,
589
- "content": "<extra_id_41>",
590
- "single_word": false,
591
- "lstrip": true,
592
- "rstrip": false,
593
- "normalized": true,
594
- "special": true
595
- },
596
- {
597
- "id": 32059,
598
- "content": "<extra_id_40>",
599
- "single_word": false,
600
- "lstrip": true,
601
- "rstrip": false,
602
- "normalized": true,
603
- "special": true
604
- },
605
- {
606
- "id": 32060,
607
- "content": "<extra_id_39>",
608
- "single_word": false,
609
- "lstrip": true,
610
- "rstrip": false,
611
- "normalized": true,
612
- "special": true
613
- },
614
- {
615
- "id": 32061,
616
- "content": "<extra_id_38>",
617
- "single_word": false,
618
- "lstrip": true,
619
- "rstrip": false,
620
- "normalized": true,
621
- "special": true
622
- },
623
- {
624
- "id": 32062,
625
- "content": "<extra_id_37>",
626
- "single_word": false,
627
- "lstrip": true,
628
- "rstrip": false,
629
- "normalized": true,
630
- "special": true
631
- },
632
- {
633
- "id": 32063,
634
- "content": "<extra_id_36>",
635
- "single_word": false,
636
- "lstrip": true,
637
- "rstrip": false,
638
- "normalized": true,
639
- "special": true
640
- },
641
- {
642
- "id": 32064,
643
- "content": "<extra_id_35>",
644
- "single_word": false,
645
- "lstrip": true,
646
- "rstrip": false,
647
- "normalized": true,
648
- "special": true
649
- },
650
- {
651
- "id": 32065,
652
- "content": "<extra_id_34>",
653
- "single_word": false,
654
- "lstrip": true,
655
- "rstrip": false,
656
- "normalized": true,
657
- "special": true
658
- },
659
- {
660
- "id": 32066,
661
- "content": "<extra_id_33>",
662
- "single_word": false,
663
- "lstrip": true,
664
- "rstrip": false,
665
- "normalized": true,
666
- "special": true
667
- },
668
- {
669
- "id": 32067,
670
- "content": "<extra_id_32>",
671
- "single_word": false,
672
- "lstrip": true,
673
- "rstrip": false,
674
- "normalized": true,
675
- "special": true
676
- },
677
- {
678
- "id": 32068,
679
- "content": "<extra_id_31>",
680
- "single_word": false,
681
- "lstrip": true,
682
- "rstrip": false,
683
- "normalized": true,
684
- "special": true
685
- },
686
- {
687
- "id": 32069,
688
- "content": "<extra_id_30>",
689
- "single_word": false,
690
- "lstrip": true,
691
- "rstrip": false,
692
- "normalized": true,
693
- "special": true
694
- },
695
- {
696
- "id": 32070,
697
- "content": "<extra_id_29>",
698
- "single_word": false,
699
- "lstrip": true,
700
- "rstrip": false,
701
- "normalized": true,
702
- "special": true
703
- },
704
- {
705
- "id": 32071,
706
- "content": "<extra_id_28>",
707
- "single_word": false,
708
- "lstrip": true,
709
- "rstrip": false,
710
- "normalized": true,
711
- "special": true
712
- },
713
- {
714
- "id": 32072,
715
- "content": "<extra_id_27>",
716
- "single_word": false,
717
- "lstrip": true,
718
- "rstrip": false,
719
- "normalized": true,
720
- "special": true
721
- },
722
- {
723
- "id": 32073,
724
- "content": "<extra_id_26>",
725
- "single_word": false,
726
- "lstrip": true,
727
- "rstrip": false,
728
- "normalized": true,
729
- "special": true
730
- },
731
- {
732
- "id": 32074,
733
- "content": "<extra_id_25>",
734
- "single_word": false,
735
- "lstrip": true,
736
- "rstrip": false,
737
- "normalized": true,
738
- "special": true
739
- },
740
- {
741
- "id": 32075,
742
- "content": "<extra_id_24>",
743
- "single_word": false,
744
- "lstrip": true,
745
- "rstrip": false,
746
- "normalized": true,
747
- "special": true
748
- },
749
- {
750
- "id": 32076,
751
- "content": "<extra_id_23>",
752
- "single_word": false,
753
- "lstrip": true,
754
- "rstrip": false,
755
- "normalized": true,
756
- "special": true
757
- },
758
- {
759
- "id": 32077,
760
- "content": "<extra_id_22>",
761
- "single_word": false,
762
- "lstrip": true,
763
- "rstrip": false,
764
- "normalized": true,
765
- "special": true
766
- },
767
- {
768
- "id": 32078,
769
- "content": "<extra_id_21>",
770
- "single_word": false,
771
- "lstrip": true,
772
- "rstrip": false,
773
- "normalized": true,
774
- "special": true
775
- },
776
- {
777
- "id": 32079,
778
- "content": "<extra_id_20>",
779
- "single_word": false,
780
- "lstrip": true,
781
- "rstrip": false,
782
- "normalized": true,
783
- "special": true
784
- },
785
- {
786
- "id": 32080,
787
- "content": "<extra_id_19>",
788
- "single_word": false,
789
- "lstrip": true,
790
- "rstrip": false,
791
- "normalized": true,
792
- "special": true
793
- },
794
- {
795
- "id": 32081,
796
- "content": "<extra_id_18>",
797
- "single_word": false,
798
- "lstrip": true,
799
- "rstrip": false,
800
- "normalized": true,
801
- "special": true
802
- },
803
- {
804
- "id": 32082,
805
- "content": "<extra_id_17>",
806
- "single_word": false,
807
- "lstrip": true,
808
- "rstrip": false,
809
- "normalized": true,
810
- "special": true
811
- },
812
- {
813
- "id": 32083,
814
- "content": "<extra_id_16>",
815
- "single_word": false,
816
- "lstrip": true,
817
- "rstrip": false,
818
- "normalized": true,
819
- "special": true
820
- },
821
- {
822
- "id": 32084,
823
- "content": "<extra_id_15>",
824
- "single_word": false,
825
- "lstrip": true,
826
- "rstrip": false,
827
- "normalized": true,
828
- "special": true
829
- },
830
- {
831
- "id": 32085,
832
- "content": "<extra_id_14>",
833
- "single_word": false,
834
- "lstrip": true,
835
- "rstrip": false,
836
- "normalized": true,
837
- "special": true
838
- },
839
- {
840
- "id": 32086,
841
- "content": "<extra_id_13>",
842
- "single_word": false,
843
- "lstrip": true,
844
- "rstrip": false,
845
- "normalized": true,
846
- "special": true
847
- },
848
- {
849
- "id": 32087,
850
- "content": "<extra_id_12>",
851
- "single_word": false,
852
- "lstrip": true,
853
- "rstrip": false,
854
- "normalized": true,
855
- "special": true
856
- },
857
- {
858
- "id": 32088,
859
- "content": "<extra_id_11>",
860
- "single_word": false,
861
- "lstrip": true,
862
- "rstrip": false,
863
- "normalized": true,
864
- "special": true
865
- },
866
- {
867
- "id": 32089,
868
- "content": "<extra_id_10>",
869
- "single_word": false,
870
- "lstrip": true,
871
- "rstrip": false,
872
- "normalized": true,
873
- "special": true
874
- },
875
- {
876
- "id": 32090,
877
- "content": "<extra_id_9>",
878
- "single_word": false,
879
- "lstrip": true,
880
- "rstrip": false,
881
- "normalized": true,
882
- "special": true
883
- },
884
- {
885
- "id": 32091,
886
- "content": "<extra_id_8>",
887
- "single_word": false,
888
- "lstrip": true,
889
- "rstrip": false,
890
- "normalized": true,
891
- "special": true
892
- },
893
- {
894
- "id": 32092,
895
- "content": "<extra_id_7>",
896
- "single_word": false,
897
- "lstrip": true,
898
- "rstrip": false,
899
- "normalized": true,
900
- "special": true
901
- },
902
- {
903
- "id": 32093,
904
- "content": "<extra_id_6>",
905
- "single_word": false,
906
- "lstrip": true,
907
- "rstrip": false,
908
- "normalized": true,
909
- "special": true
910
- },
911
- {
912
- "id": 32094,
913
- "content": "<extra_id_5>",
914
- "single_word": false,
915
- "lstrip": true,
916
- "rstrip": false,
917
- "normalized": true,
918
- "special": true
919
- },
920
- {
921
- "id": 32095,
922
- "content": "<extra_id_4>",
923
- "single_word": false,
924
- "lstrip": true,
925
- "rstrip": false,
926
- "normalized": true,
927
- "special": true
928
- },
929
- {
930
- "id": 32096,
931
- "content": "<extra_id_3>",
932
- "single_word": false,
933
- "lstrip": true,
934
- "rstrip": false,
935
- "normalized": true,
936
- "special": true
937
- },
938
- {
939
- "id": 32097,
940
- "content": "<extra_id_2>",
941
- "single_word": false,
942
- "lstrip": true,
943
- "rstrip": false,
944
- "normalized": true,
945
- "special": true
946
- },
947
- {
948
- "id": 32098,
949
- "content": "<extra_id_1>",
950
- "single_word": false,
951
- "lstrip": true,
952
- "rstrip": false,
953
- "normalized": true,
954
- "special": true
955
- },
956
- {
957
- "id": 32099,
958
- "content": "<extra_id_0>",
959
- "single_word": false,
960
- "lstrip": true,
961
- "rstrip": false,
962
- "normalized": true,
963
- "special": true
964
  }
965
  ],
966
  "normalizer": null,
@@ -36813,10 +35913,6 @@
36813
  "pr",
36814
  "int"
36815
  ],
36816
- [
36817
- "#",
36818
- "#"
36819
- ],
36820
  [
36821
  "W",
36822
  "ith"
@@ -39937,10 +39033,6 @@
39937
  "b",
39938
  "ase"
39939
  ],
39940
- [
39941
- "##",
39942
- "##"
39943
- ],
39944
  [
39945
  "R",
39946
  "el"
@@ -44969,10 +44061,6 @@
44969
  "Ġre",
44970
  "trie"
44971
  ],
44972
- [
44973
- "####",
44974
- "####"
44975
- ],
44976
  [
44977
  "Ġmult",
44978
  "iple"
@@ -46625,10 +45713,6 @@
46625
  "At",
46626
  "om"
46627
  ],
46628
- [
46629
- "#",
46630
- "{"
46631
- ],
46632
  [
46633
  "Ġro",
46634
  "und"
@@ -54121,10 +53205,6 @@
54121
  "Ġex",
54122
  "plicit"
54123
  ],
54124
- [
54125
- "########",
54126
- "########"
54127
- ],
54128
  [
54129
  "Service",
54130
  "Response"
@@ -72209,10 +71289,6 @@
72209
  "el",
72210
  "em"
72211
  ],
72212
- [
72213
- "#",
72214
- "'"
72215
- ],
72216
  [
72217
  "Ġcon",
72218
  "versation"
@@ -72617,10 +71693,6 @@
72617
  "ĠPre",
72618
  "fix"
72619
  ],
72620
- [
72621
- "################",
72622
- "################"
72623
- ],
72624
  [
72625
  "s",
72626
  "ources"
@@ -84661,10 +83733,6 @@
84661
  "Ġh",
84662
  "el"
84663
  ],
84664
- [
84665
- "##",
84666
- "#"
84667
- ],
84668
  [
84669
  "And",
84670
  "Set"
@@ -100589,10 +99657,6 @@
100589
  "Ġrule",
100590
  "ValidID"
100591
  ],
100592
- [
100593
- "#",
100594
- "\""
100595
- ],
100596
  [
100597
  "^",
100598
  "\\"
@@ -116621,10 +115685,6 @@
116621
  "ĠUn",
116622
  "der"
116623
  ],
116624
- [
116625
- "#{",
116626
- "@"
116627
- ],
116628
  [
116629
  "ĠAct",
116630
  "or"
@@ -138005,10 +137065,6 @@
138005
  "Queue",
138006
  "Entry"
138007
  ],
138008
- [
138009
- "########",
138010
- "####"
138011
- ],
138012
  [
138013
  "alan",
138014
  "ces"
@@ -154045,10 +153101,6 @@
154045
  "SETT",
154046
  "ABLE"
154047
  ],
154048
- [
154049
- "#",
154050
- "$"
154051
- ],
154052
  [
154053
  "C",
154054
  "ores"
@@ -154449,10 +153501,6 @@
154449
  "ENDI",
154450
  "AN"
154451
  ],
154452
- [
154453
- "#",
154454
- "__"
154455
- ],
154456
  [
154457
  ">",
154458
  "`"
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 256,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
+ "Fixed": 256
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
 
61
  "rstrip": false,
62
  "normalized": true,
63
  "special": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
64
  }
65
  ],
66
  "normalizer": null,
 
35913
  "pr",
35914
  "int"
35915
  ],
 
 
 
 
35916
  [
35917
  "W",
35918
  "ith"
 
39033
  "b",
39034
  "ase"
39035
  ],
 
 
 
 
39036
  [
39037
  "R",
39038
  "el"
 
44061
  "Ġre",
44062
  "trie"
44063
  ],
 
 
 
 
44064
  [
44065
  "Ġmult",
44066
  "iple"
 
45713
  "At",
45714
  "om"
45715
  ],
 
 
 
 
45716
  [
45717
  "Ġro",
45718
  "und"
 
53205
  "Ġex",
53206
  "plicit"
53207
  ],
 
 
 
 
53208
  [
53209
  "Service",
53210
  "Response"
 
71289
  "el",
71290
  "em"
71291
  ],
 
 
 
 
71292
  [
71293
  "Ġcon",
71294
  "versation"
 
71693
  "ĠPre",
71694
  "fix"
71695
  ],
 
 
 
 
71696
  [
71697
  "s",
71698
  "ources"
 
83733
  "Ġh",
83734
  "el"
83735
  ],
 
 
 
 
83736
  [
83737
  "And",
83738
  "Set"
 
99657
  "Ġrule",
99658
  "ValidID"
99659
  ],
 
 
 
 
99660
  [
99661
  "^",
99662
  "\\"
 
115685
  "ĠUn",
115686
  "der"
115687
  ],
 
 
 
 
115688
  [
115689
  "ĠAct",
115690
  "or"
 
137065
  "Queue",
137066
  "Entry"
137067
  ],
 
 
 
 
137068
  [
137069
  "alan",
137070
  "ces"
 
153101
  "SETT",
153102
  "ABLE"
153103
  ],
 
 
 
 
153104
  [
153105
  "C",
153106
  "ores"
 
153501
  "ENDI",
153502
  "AN"
153503
  ],
 
 
 
 
153504
  [
153505
  ">",
153506
  "`"
tokenizer_config.json CHANGED
@@ -1,955 +1,714 @@
1
  {
2
  "add_prefix_space": false,
3
- "added_tokens_decoder": {
4
- "0": {
5
- "content": "<pad>",
6
- "lstrip": false,
7
- "normalized": true,
8
- "rstrip": false,
9
- "single_word": false,
10
- "special": true
11
- },
12
- "1": {
13
- "content": "<s>",
14
- "lstrip": false,
15
- "normalized": true,
16
- "rstrip": false,
17
- "single_word": false,
18
- "special": true
19
- },
20
- "2": {
21
- "content": "</s>",
22
- "lstrip": false,
23
- "normalized": true,
24
- "rstrip": false,
25
- "single_word": false,
26
- "special": true
27
- },
28
- "3": {
29
- "content": "<unk>",
30
- "lstrip": false,
31
- "normalized": true,
32
- "rstrip": false,
33
- "single_word": false,
34
- "special": true
35
- },
36
- "4": {
37
- "content": "<mask>",
38
- "lstrip": true,
39
- "normalized": true,
40
- "rstrip": false,
41
- "single_word": false,
42
- "special": true
43
- },
44
- "32000": {
45
  "content": "<extra_id_99>",
46
  "lstrip": true,
47
  "normalized": true,
48
  "rstrip": false,
49
- "single_word": false,
50
- "special": true
51
  },
52
- "32001": {
53
  "content": "<extra_id_98>",
54
  "lstrip": true,
55
  "normalized": true,
56
  "rstrip": false,
57
- "single_word": false,
58
- "special": true
59
  },
60
- "32002": {
61
  "content": "<extra_id_97>",
62
  "lstrip": true,
63
  "normalized": true,
64
  "rstrip": false,
65
- "single_word": false,
66
- "special": true
67
  },
68
- "32003": {
69
  "content": "<extra_id_96>",
70
  "lstrip": true,
71
  "normalized": true,
72
  "rstrip": false,
73
- "single_word": false,
74
- "special": true
75
  },
76
- "32004": {
77
  "content": "<extra_id_95>",
78
  "lstrip": true,
79
  "normalized": true,
80
  "rstrip": false,
81
- "single_word": false,
82
- "special": true
83
  },
84
- "32005": {
85
  "content": "<extra_id_94>",
86
  "lstrip": true,
87
  "normalized": true,
88
  "rstrip": false,
89
- "single_word": false,
90
- "special": true
91
  },
92
- "32006": {
93
  "content": "<extra_id_93>",
94
  "lstrip": true,
95
  "normalized": true,
96
  "rstrip": false,
97
- "single_word": false,
98
- "special": true
99
  },
100
- "32007": {
101
  "content": "<extra_id_92>",
102
  "lstrip": true,
103
  "normalized": true,
104
  "rstrip": false,
105
- "single_word": false,
106
- "special": true
107
  },
108
- "32008": {
109
  "content": "<extra_id_91>",
110
  "lstrip": true,
111
  "normalized": true,
112
  "rstrip": false,
113
- "single_word": false,
114
- "special": true
115
  },
116
- "32009": {
117
  "content": "<extra_id_90>",
118
  "lstrip": true,
119
  "normalized": true,
120
  "rstrip": false,
121
- "single_word": false,
122
- "special": true
123
  },
124
- "32010": {
125
  "content": "<extra_id_89>",
126
  "lstrip": true,
127
  "normalized": true,
128
  "rstrip": false,
129
- "single_word": false,
130
- "special": true
131
  },
132
- "32011": {
133
  "content": "<extra_id_88>",
134
  "lstrip": true,
135
  "normalized": true,
136
  "rstrip": false,
137
- "single_word": false,
138
- "special": true
139
  },
140
- "32012": {
141
  "content": "<extra_id_87>",
142
  "lstrip": true,
143
  "normalized": true,
144
  "rstrip": false,
145
- "single_word": false,
146
- "special": true
147
  },
148
- "32013": {
149
  "content": "<extra_id_86>",
150
  "lstrip": true,
151
  "normalized": true,
152
  "rstrip": false,
153
- "single_word": false,
154
- "special": true
155
  },
156
- "32014": {
157
  "content": "<extra_id_85>",
158
  "lstrip": true,
159
  "normalized": true,
160
  "rstrip": false,
161
- "single_word": false,
162
- "special": true
163
  },
164
- "32015": {
165
  "content": "<extra_id_84>",
166
  "lstrip": true,
167
  "normalized": true,
168
  "rstrip": false,
169
- "single_word": false,
170
- "special": true
171
  },
172
- "32016": {
173
  "content": "<extra_id_83>",
174
  "lstrip": true,
175
  "normalized": true,
176
  "rstrip": false,
177
- "single_word": false,
178
- "special": true
179
  },
180
- "32017": {
181
  "content": "<extra_id_82>",
182
  "lstrip": true,
183
  "normalized": true,
184
  "rstrip": false,
185
- "single_word": false,
186
- "special": true
187
  },
188
- "32018": {
189
  "content": "<extra_id_81>",
190
  "lstrip": true,
191
  "normalized": true,
192
  "rstrip": false,
193
- "single_word": false,
194
- "special": true
195
  },
196
- "32019": {
197
  "content": "<extra_id_80>",
198
  "lstrip": true,
199
  "normalized": true,
200
  "rstrip": false,
201
- "single_word": false,
202
- "special": true
203
  },
204
- "32020": {
205
  "content": "<extra_id_79>",
206
  "lstrip": true,
207
  "normalized": true,
208
  "rstrip": false,
209
- "single_word": false,
210
- "special": true
211
  },
212
- "32021": {
213
  "content": "<extra_id_78>",
214
  "lstrip": true,
215
  "normalized": true,
216
  "rstrip": false,
217
- "single_word": false,
218
- "special": true
219
  },
220
- "32022": {
221
  "content": "<extra_id_77>",
222
  "lstrip": true,
223
  "normalized": true,
224
  "rstrip": false,
225
- "single_word": false,
226
- "special": true
227
  },
228
- "32023": {
229
  "content": "<extra_id_76>",
230
  "lstrip": true,
231
  "normalized": true,
232
  "rstrip": false,
233
- "single_word": false,
234
- "special": true
235
  },
236
- "32024": {
237
  "content": "<extra_id_75>",
238
  "lstrip": true,
239
  "normalized": true,
240
  "rstrip": false,
241
- "single_word": false,
242
- "special": true
243
  },
244
- "32025": {
245
  "content": "<extra_id_74>",
246
  "lstrip": true,
247
  "normalized": true,
248
  "rstrip": false,
249
- "single_word": false,
250
- "special": true
251
  },
252
- "32026": {
253
  "content": "<extra_id_73>",
254
  "lstrip": true,
255
  "normalized": true,
256
  "rstrip": false,
257
- "single_word": false,
258
- "special": true
259
  },
260
- "32027": {
261
  "content": "<extra_id_72>",
262
  "lstrip": true,
263
  "normalized": true,
264
  "rstrip": false,
265
- "single_word": false,
266
- "special": true
267
  },
268
- "32028": {
269
  "content": "<extra_id_71>",
270
  "lstrip": true,
271
  "normalized": true,
272
  "rstrip": false,
273
- "single_word": false,
274
- "special": true
275
  },
276
- "32029": {
277
  "content": "<extra_id_70>",
278
  "lstrip": true,
279
  "normalized": true,
280
  "rstrip": false,
281
- "single_word": false,
282
- "special": true
283
  },
284
- "32030": {
285
  "content": "<extra_id_69>",
286
  "lstrip": true,
287
  "normalized": true,
288
  "rstrip": false,
289
- "single_word": false,
290
- "special": true
291
  },
292
- "32031": {
293
  "content": "<extra_id_68>",
294
  "lstrip": true,
295
  "normalized": true,
296
  "rstrip": false,
297
- "single_word": false,
298
- "special": true
299
  },
300
- "32032": {
301
  "content": "<extra_id_67>",
302
  "lstrip": true,
303
  "normalized": true,
304
  "rstrip": false,
305
- "single_word": false,
306
- "special": true
307
  },
308
- "32033": {
309
  "content": "<extra_id_66>",
310
  "lstrip": true,
311
  "normalized": true,
312
  "rstrip": false,
313
- "single_word": false,
314
- "special": true
315
  },
316
- "32034": {
317
  "content": "<extra_id_65>",
318
  "lstrip": true,
319
  "normalized": true,
320
  "rstrip": false,
321
- "single_word": false,
322
- "special": true
323
  },
324
- "32035": {
325
  "content": "<extra_id_64>",
326
  "lstrip": true,
327
  "normalized": true,
328
  "rstrip": false,
329
- "single_word": false,
330
- "special": true
331
  },
332
- "32036": {
333
  "content": "<extra_id_63>",
334
  "lstrip": true,
335
  "normalized": true,
336
  "rstrip": false,
337
- "single_word": false,
338
- "special": true
339
  },
340
- "32037": {
341
  "content": "<extra_id_62>",
342
  "lstrip": true,
343
  "normalized": true,
344
  "rstrip": false,
345
- "single_word": false,
346
- "special": true
347
  },
348
- "32038": {
349
  "content": "<extra_id_61>",
350
  "lstrip": true,
351
  "normalized": true,
352
  "rstrip": false,
353
- "single_word": false,
354
- "special": true
355
  },
356
- "32039": {
357
  "content": "<extra_id_60>",
358
  "lstrip": true,
359
  "normalized": true,
360
  "rstrip": false,
361
- "single_word": false,
362
- "special": true
363
  },
364
- "32040": {
365
  "content": "<extra_id_59>",
366
  "lstrip": true,
367
  "normalized": true,
368
  "rstrip": false,
369
- "single_word": false,
370
- "special": true
371
  },
372
- "32041": {
373
  "content": "<extra_id_58>",
374
  "lstrip": true,
375
  "normalized": true,
376
  "rstrip": false,
377
- "single_word": false,
378
- "special": true
379
  },
380
- "32042": {
381
  "content": "<extra_id_57>",
382
  "lstrip": true,
383
  "normalized": true,
384
  "rstrip": false,
385
- "single_word": false,
386
- "special": true
387
  },
388
- "32043": {
389
  "content": "<extra_id_56>",
390
  "lstrip": true,
391
  "normalized": true,
392
  "rstrip": false,
393
- "single_word": false,
394
- "special": true
395
  },
396
- "32044": {
397
  "content": "<extra_id_55>",
398
  "lstrip": true,
399
  "normalized": true,
400
  "rstrip": false,
401
- "single_word": false,
402
- "special": true
403
  },
404
- "32045": {
405
  "content": "<extra_id_54>",
406
  "lstrip": true,
407
  "normalized": true,
408
  "rstrip": false,
409
- "single_word": false,
410
- "special": true
411
  },
412
- "32046": {
413
  "content": "<extra_id_53>",
414
  "lstrip": true,
415
  "normalized": true,
416
  "rstrip": false,
417
- "single_word": false,
418
- "special": true
419
  },
420
- "32047": {
421
  "content": "<extra_id_52>",
422
  "lstrip": true,
423
  "normalized": true,
424
  "rstrip": false,
425
- "single_word": false,
426
- "special": true
427
  },
428
- "32048": {
429
  "content": "<extra_id_51>",
430
  "lstrip": true,
431
  "normalized": true,
432
  "rstrip": false,
433
- "single_word": false,
434
- "special": true
435
  },
436
- "32049": {
437
  "content": "<extra_id_50>",
438
  "lstrip": true,
439
  "normalized": true,
440
  "rstrip": false,
441
- "single_word": false,
442
- "special": true
443
  },
444
- "32050": {
445
  "content": "<extra_id_49>",
446
  "lstrip": true,
447
  "normalized": true,
448
  "rstrip": false,
449
- "single_word": false,
450
- "special": true
451
  },
452
- "32051": {
453
  "content": "<extra_id_48>",
454
  "lstrip": true,
455
  "normalized": true,
456
  "rstrip": false,
457
- "single_word": false,
458
- "special": true
459
  },
460
- "32052": {
461
  "content": "<extra_id_47>",
462
  "lstrip": true,
463
  "normalized": true,
464
  "rstrip": false,
465
- "single_word": false,
466
- "special": true
467
  },
468
- "32053": {
469
  "content": "<extra_id_46>",
470
  "lstrip": true,
471
  "normalized": true,
472
  "rstrip": false,
473
- "single_word": false,
474
- "special": true
475
  },
476
- "32054": {
477
  "content": "<extra_id_45>",
478
  "lstrip": true,
479
  "normalized": true,
480
  "rstrip": false,
481
- "single_word": false,
482
- "special": true
483
  },
484
- "32055": {
485
  "content": "<extra_id_44>",
486
  "lstrip": true,
487
  "normalized": true,
488
  "rstrip": false,
489
- "single_word": false,
490
- "special": true
491
  },
492
- "32056": {
493
  "content": "<extra_id_43>",
494
  "lstrip": true,
495
  "normalized": true,
496
  "rstrip": false,
497
- "single_word": false,
498
- "special": true
499
  },
500
- "32057": {
501
  "content": "<extra_id_42>",
502
  "lstrip": true,
503
  "normalized": true,
504
  "rstrip": false,
505
- "single_word": false,
506
- "special": true
507
  },
508
- "32058": {
509
  "content": "<extra_id_41>",
510
  "lstrip": true,
511
  "normalized": true,
512
  "rstrip": false,
513
- "single_word": false,
514
- "special": true
515
  },
516
- "32059": {
517
  "content": "<extra_id_40>",
518
  "lstrip": true,
519
  "normalized": true,
520
  "rstrip": false,
521
- "single_word": false,
522
- "special": true
523
  },
524
- "32060": {
525
  "content": "<extra_id_39>",
526
  "lstrip": true,
527
  "normalized": true,
528
  "rstrip": false,
529
- "single_word": false,
530
- "special": true
531
  },
532
- "32061": {
533
  "content": "<extra_id_38>",
534
  "lstrip": true,
535
  "normalized": true,
536
  "rstrip": false,
537
- "single_word": false,
538
- "special": true
539
  },
540
- "32062": {
541
  "content": "<extra_id_37>",
542
  "lstrip": true,
543
  "normalized": true,
544
  "rstrip": false,
545
- "single_word": false,
546
- "special": true
547
  },
548
- "32063": {
549
  "content": "<extra_id_36>",
550
  "lstrip": true,
551
  "normalized": true,
552
  "rstrip": false,
553
- "single_word": false,
554
- "special": true
555
  },
556
- "32064": {
557
  "content": "<extra_id_35>",
558
  "lstrip": true,
559
  "normalized": true,
560
  "rstrip": false,
561
- "single_word": false,
562
- "special": true
563
  },
564
- "32065": {
565
  "content": "<extra_id_34>",
566
  "lstrip": true,
567
  "normalized": true,
568
  "rstrip": false,
569
- "single_word": false,
570
- "special": true
571
  },
572
- "32066": {
573
  "content": "<extra_id_33>",
574
  "lstrip": true,
575
  "normalized": true,
576
  "rstrip": false,
577
- "single_word": false,
578
- "special": true
579
  },
580
- "32067": {
581
  "content": "<extra_id_32>",
582
  "lstrip": true,
583
  "normalized": true,
584
  "rstrip": false,
585
- "single_word": false,
586
- "special": true
587
  },
588
- "32068": {
589
  "content": "<extra_id_31>",
590
  "lstrip": true,
591
  "normalized": true,
592
  "rstrip": false,
593
- "single_word": false,
594
- "special": true
595
  },
596
- "32069": {
597
  "content": "<extra_id_30>",
598
  "lstrip": true,
599
  "normalized": true,
600
  "rstrip": false,
601
- "single_word": false,
602
- "special": true
603
  },
604
- "32070": {
605
  "content": "<extra_id_29>",
606
  "lstrip": true,
607
  "normalized": true,
608
  "rstrip": false,
609
- "single_word": false,
610
- "special": true
611
  },
612
- "32071": {
613
  "content": "<extra_id_28>",
614
  "lstrip": true,
615
  "normalized": true,
616
  "rstrip": false,
617
- "single_word": false,
618
- "special": true
619
  },
620
- "32072": {
621
  "content": "<extra_id_27>",
622
  "lstrip": true,
623
  "normalized": true,
624
  "rstrip": false,
625
- "single_word": false,
626
- "special": true
627
  },
628
- "32073": {
629
  "content": "<extra_id_26>",
630
  "lstrip": true,
631
  "normalized": true,
632
  "rstrip": false,
633
- "single_word": false,
634
- "special": true
635
  },
636
- "32074": {
637
  "content": "<extra_id_25>",
638
  "lstrip": true,
639
  "normalized": true,
640
  "rstrip": false,
641
- "single_word": false,
642
- "special": true
643
  },
644
- "32075": {
645
  "content": "<extra_id_24>",
646
  "lstrip": true,
647
  "normalized": true,
648
  "rstrip": false,
649
- "single_word": false,
650
- "special": true
651
  },
652
- "32076": {
653
  "content": "<extra_id_23>",
654
  "lstrip": true,
655
  "normalized": true,
656
  "rstrip": false,
657
- "single_word": false,
658
- "special": true
659
  },
660
- "32077": {
661
  "content": "<extra_id_22>",
662
  "lstrip": true,
663
  "normalized": true,
664
  "rstrip": false,
665
- "single_word": false,
666
- "special": true
667
  },
668
- "32078": {
669
  "content": "<extra_id_21>",
670
  "lstrip": true,
671
  "normalized": true,
672
  "rstrip": false,
673
- "single_word": false,
674
- "special": true
675
  },
676
- "32079": {
677
  "content": "<extra_id_20>",
678
  "lstrip": true,
679
  "normalized": true,
680
  "rstrip": false,
681
- "single_word": false,
682
- "special": true
683
  },
684
- "32080": {
685
  "content": "<extra_id_19>",
686
  "lstrip": true,
687
  "normalized": true,
688
  "rstrip": false,
689
- "single_word": false,
690
- "special": true
691
  },
692
- "32081": {
693
  "content": "<extra_id_18>",
694
  "lstrip": true,
695
  "normalized": true,
696
  "rstrip": false,
697
- "single_word": false,
698
- "special": true
699
  },
700
- "32082": {
701
  "content": "<extra_id_17>",
702
  "lstrip": true,
703
  "normalized": true,
704
  "rstrip": false,
705
- "single_word": false,
706
- "special": true
707
  },
708
- "32083": {
709
  "content": "<extra_id_16>",
710
  "lstrip": true,
711
  "normalized": true,
712
  "rstrip": false,
713
- "single_word": false,
714
- "special": true
715
  },
716
- "32084": {
717
  "content": "<extra_id_15>",
718
  "lstrip": true,
719
  "normalized": true,
720
  "rstrip": false,
721
- "single_word": false,
722
- "special": true
723
  },
724
- "32085": {
725
  "content": "<extra_id_14>",
726
  "lstrip": true,
727
  "normalized": true,
728
  "rstrip": false,
729
- "single_word": false,
730
- "special": true
731
  },
732
- "32086": {
733
  "content": "<extra_id_13>",
734
  "lstrip": true,
735
  "normalized": true,
736
  "rstrip": false,
737
- "single_word": false,
738
- "special": true
739
  },
740
- "32087": {
741
  "content": "<extra_id_12>",
742
  "lstrip": true,
743
  "normalized": true,
744
  "rstrip": false,
745
- "single_word": false,
746
- "special": true
747
  },
748
- "32088": {
749
  "content": "<extra_id_11>",
750
  "lstrip": true,
751
  "normalized": true,
752
  "rstrip": false,
753
- "single_word": false,
754
- "special": true
755
  },
756
- "32089": {
757
  "content": "<extra_id_10>",
758
  "lstrip": true,
759
  "normalized": true,
760
  "rstrip": false,
761
- "single_word": false,
762
- "special": true
763
  },
764
- "32090": {
765
  "content": "<extra_id_9>",
766
  "lstrip": true,
767
  "normalized": true,
768
  "rstrip": false,
769
- "single_word": false,
770
- "special": true
771
  },
772
- "32091": {
773
  "content": "<extra_id_8>",
774
  "lstrip": true,
775
  "normalized": true,
776
  "rstrip": false,
777
- "single_word": false,
778
- "special": true
779
  },
780
- "32092": {
781
  "content": "<extra_id_7>",
782
  "lstrip": true,
783
  "normalized": true,
784
  "rstrip": false,
785
- "single_word": false,
786
- "special": true
787
  },
788
- "32093": {
789
  "content": "<extra_id_6>",
790
  "lstrip": true,
791
  "normalized": true,
792
  "rstrip": false,
793
- "single_word": false,
794
- "special": true
795
  },
796
- "32094": {
797
  "content": "<extra_id_5>",
798
  "lstrip": true,
799
  "normalized": true,
800
  "rstrip": false,
801
- "single_word": false,
802
- "special": true
803
  },
804
- "32095": {
805
  "content": "<extra_id_4>",
806
  "lstrip": true,
807
  "normalized": true,
808
  "rstrip": false,
809
- "single_word": false,
810
- "special": true
811
  },
812
- "32096": {
813
  "content": "<extra_id_3>",
814
  "lstrip": true,
815
  "normalized": true,
816
  "rstrip": false,
817
- "single_word": false,
818
- "special": true
819
  },
820
- "32097": {
821
  "content": "<extra_id_2>",
822
  "lstrip": true,
823
  "normalized": true,
824
  "rstrip": false,
825
- "single_word": false,
826
- "special": true
827
  },
828
- "32098": {
829
  "content": "<extra_id_1>",
830
  "lstrip": true,
831
  "normalized": true,
832
  "rstrip": false,
833
- "single_word": false,
834
- "special": true
835
  },
836
- "32099": {
837
  "content": "<extra_id_0>",
838
  "lstrip": true,
839
  "normalized": true,
840
  "rstrip": false,
841
- "single_word": false,
842
- "special": true
843
  }
844
- },
845
- "additional_special_tokens": [
846
- "<extra_id_99>",
847
- "<extra_id_98>",
848
- "<extra_id_97>",
849
- "<extra_id_96>",
850
- "<extra_id_95>",
851
- "<extra_id_94>",
852
- "<extra_id_93>",
853
- "<extra_id_92>",
854
- "<extra_id_91>",
855
- "<extra_id_90>",
856
- "<extra_id_89>",
857
- "<extra_id_88>",
858
- "<extra_id_87>",
859
- "<extra_id_86>",
860
- "<extra_id_85>",
861
- "<extra_id_84>",
862
- "<extra_id_83>",
863
- "<extra_id_82>",
864
- "<extra_id_81>",
865
- "<extra_id_80>",
866
- "<extra_id_79>",
867
- "<extra_id_78>",
868
- "<extra_id_77>",
869
- "<extra_id_76>",
870
- "<extra_id_75>",
871
- "<extra_id_74>",
872
- "<extra_id_73>",
873
- "<extra_id_72>",
874
- "<extra_id_71>",
875
- "<extra_id_70>",
876
- "<extra_id_69>",
877
- "<extra_id_68>",
878
- "<extra_id_67>",
879
- "<extra_id_66>",
880
- "<extra_id_65>",
881
- "<extra_id_64>",
882
- "<extra_id_63>",
883
- "<extra_id_62>",
884
- "<extra_id_61>",
885
- "<extra_id_60>",
886
- "<extra_id_59>",
887
- "<extra_id_58>",
888
- "<extra_id_57>",
889
- "<extra_id_56>",
890
- "<extra_id_55>",
891
- "<extra_id_54>",
892
- "<extra_id_53>",
893
- "<extra_id_52>",
894
- "<extra_id_51>",
895
- "<extra_id_50>",
896
- "<extra_id_49>",
897
- "<extra_id_48>",
898
- "<extra_id_47>",
899
- "<extra_id_46>",
900
- "<extra_id_45>",
901
- "<extra_id_44>",
902
- "<extra_id_43>",
903
- "<extra_id_42>",
904
- "<extra_id_41>",
905
- "<extra_id_40>",
906
- "<extra_id_39>",
907
- "<extra_id_38>",
908
- "<extra_id_37>",
909
- "<extra_id_36>",
910
- "<extra_id_35>",
911
- "<extra_id_34>",
912
- "<extra_id_33>",
913
- "<extra_id_32>",
914
- "<extra_id_31>",
915
- "<extra_id_30>",
916
- "<extra_id_29>",
917
- "<extra_id_28>",
918
- "<extra_id_27>",
919
- "<extra_id_26>",
920
- "<extra_id_25>",
921
- "<extra_id_24>",
922
- "<extra_id_23>",
923
- "<extra_id_22>",
924
- "<extra_id_21>",
925
- "<extra_id_20>",
926
- "<extra_id_19>",
927
- "<extra_id_18>",
928
- "<extra_id_17>",
929
- "<extra_id_16>",
930
- "<extra_id_15>",
931
- "<extra_id_14>",
932
- "<extra_id_13>",
933
- "<extra_id_12>",
934
- "<extra_id_11>",
935
- "<extra_id_10>",
936
- "<extra_id_9>",
937
- "<extra_id_8>",
938
- "<extra_id_7>",
939
- "<extra_id_6>",
940
- "<extra_id_5>",
941
- "<extra_id_4>",
942
- "<extra_id_3>",
943
- "<extra_id_2>",
944
- "<extra_id_1>",
945
- "<extra_id_0>"
946
  ],
 
947
  "bos_token": "<s>",
948
- "clean_up_tokenization_spaces": false,
949
  "cls_token": "<s>",
950
  "eos_token": "</s>",
951
  "errors": "replace",
952
- "extra_special_tokens": {},
 
953
  "mask_token": "<mask>",
954
  "model_max_length": 512,
955
  "pad_token": "<pad>",
 
1
  {
2
  "add_prefix_space": false,
3
+ "additional_special_tokens": [
4
+ {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "content": "<extra_id_99>",
6
  "lstrip": true,
7
  "normalized": true,
8
  "rstrip": false,
9
+ "single_word": false
 
10
  },
11
+ {
12
  "content": "<extra_id_98>",
13
  "lstrip": true,
14
  "normalized": true,
15
  "rstrip": false,
16
+ "single_word": false
 
17
  },
18
+ {
19
  "content": "<extra_id_97>",
20
  "lstrip": true,
21
  "normalized": true,
22
  "rstrip": false,
23
+ "single_word": false
 
24
  },
25
+ {
26
  "content": "<extra_id_96>",
27
  "lstrip": true,
28
  "normalized": true,
29
  "rstrip": false,
30
+ "single_word": false
 
31
  },
32
+ {
33
  "content": "<extra_id_95>",
34
  "lstrip": true,
35
  "normalized": true,
36
  "rstrip": false,
37
+ "single_word": false
 
38
  },
39
+ {
40
  "content": "<extra_id_94>",
41
  "lstrip": true,
42
  "normalized": true,
43
  "rstrip": false,
44
+ "single_word": false
 
45
  },
46
+ {
47
  "content": "<extra_id_93>",
48
  "lstrip": true,
49
  "normalized": true,
50
  "rstrip": false,
51
+ "single_word": false
 
52
  },
53
+ {
54
  "content": "<extra_id_92>",
55
  "lstrip": true,
56
  "normalized": true,
57
  "rstrip": false,
58
+ "single_word": false
 
59
  },
60
+ {
61
  "content": "<extra_id_91>",
62
  "lstrip": true,
63
  "normalized": true,
64
  "rstrip": false,
65
+ "single_word": false
 
66
  },
67
+ {
68
  "content": "<extra_id_90>",
69
  "lstrip": true,
70
  "normalized": true,
71
  "rstrip": false,
72
+ "single_word": false
 
73
  },
74
+ {
75
  "content": "<extra_id_89>",
76
  "lstrip": true,
77
  "normalized": true,
78
  "rstrip": false,
79
+ "single_word": false
 
80
  },
81
+ {
82
  "content": "<extra_id_88>",
83
  "lstrip": true,
84
  "normalized": true,
85
  "rstrip": false,
86
+ "single_word": false
 
87
  },
88
+ {
89
  "content": "<extra_id_87>",
90
  "lstrip": true,
91
  "normalized": true,
92
  "rstrip": false,
93
+ "single_word": false
 
94
  },
95
+ {
96
  "content": "<extra_id_86>",
97
  "lstrip": true,
98
  "normalized": true,
99
  "rstrip": false,
100
+ "single_word": false
 
101
  },
102
+ {
103
  "content": "<extra_id_85>",
104
  "lstrip": true,
105
  "normalized": true,
106
  "rstrip": false,
107
+ "single_word": false
 
108
  },
109
+ {
110
  "content": "<extra_id_84>",
111
  "lstrip": true,
112
  "normalized": true,
113
  "rstrip": false,
114
+ "single_word": false
 
115
  },
116
+ {
117
  "content": "<extra_id_83>",
118
  "lstrip": true,
119
  "normalized": true,
120
  "rstrip": false,
121
+ "single_word": false
 
122
  },
123
+ {
124
  "content": "<extra_id_82>",
125
  "lstrip": true,
126
  "normalized": true,
127
  "rstrip": false,
128
+ "single_word": false
 
129
  },
130
+ {
131
  "content": "<extra_id_81>",
132
  "lstrip": true,
133
  "normalized": true,
134
  "rstrip": false,
135
+ "single_word": false
 
136
  },
137
+ {
138
  "content": "<extra_id_80>",
139
  "lstrip": true,
140
  "normalized": true,
141
  "rstrip": false,
142
+ "single_word": false
 
143
  },
144
+ {
145
  "content": "<extra_id_79>",
146
  "lstrip": true,
147
  "normalized": true,
148
  "rstrip": false,
149
+ "single_word": false
 
150
  },
151
+ {
152
  "content": "<extra_id_78>",
153
  "lstrip": true,
154
  "normalized": true,
155
  "rstrip": false,
156
+ "single_word": false
 
157
  },
158
+ {
159
  "content": "<extra_id_77>",
160
  "lstrip": true,
161
  "normalized": true,
162
  "rstrip": false,
163
+ "single_word": false
 
164
  },
165
+ {
166
  "content": "<extra_id_76>",
167
  "lstrip": true,
168
  "normalized": true,
169
  "rstrip": false,
170
+ "single_word": false
 
171
  },
172
+ {
173
  "content": "<extra_id_75>",
174
  "lstrip": true,
175
  "normalized": true,
176
  "rstrip": false,
177
+ "single_word": false
 
178
  },
179
+ {
180
  "content": "<extra_id_74>",
181
  "lstrip": true,
182
  "normalized": true,
183
  "rstrip": false,
184
+ "single_word": false
 
185
  },
186
+ {
187
  "content": "<extra_id_73>",
188
  "lstrip": true,
189
  "normalized": true,
190
  "rstrip": false,
191
+ "single_word": false
 
192
  },
193
+ {
194
  "content": "<extra_id_72>",
195
  "lstrip": true,
196
  "normalized": true,
197
  "rstrip": false,
198
+ "single_word": false
 
199
  },
200
+ {
201
  "content": "<extra_id_71>",
202
  "lstrip": true,
203
  "normalized": true,
204
  "rstrip": false,
205
+ "single_word": false
 
206
  },
207
+ {
208
  "content": "<extra_id_70>",
209
  "lstrip": true,
210
  "normalized": true,
211
  "rstrip": false,
212
+ "single_word": false
 
213
  },
214
+ {
215
  "content": "<extra_id_69>",
216
  "lstrip": true,
217
  "normalized": true,
218
  "rstrip": false,
219
+ "single_word": false
 
220
  },
221
+ {
222
  "content": "<extra_id_68>",
223
  "lstrip": true,
224
  "normalized": true,
225
  "rstrip": false,
226
+ "single_word": false
 
227
  },
228
+ {
229
  "content": "<extra_id_67>",
230
  "lstrip": true,
231
  "normalized": true,
232
  "rstrip": false,
233
+ "single_word": false
 
234
  },
235
+ {
236
  "content": "<extra_id_66>",
237
  "lstrip": true,
238
  "normalized": true,
239
  "rstrip": false,
240
+ "single_word": false
 
241
  },
242
+ {
243
  "content": "<extra_id_65>",
244
  "lstrip": true,
245
  "normalized": true,
246
  "rstrip": false,
247
+ "single_word": false
 
248
  },
249
+ {
250
  "content": "<extra_id_64>",
251
  "lstrip": true,
252
  "normalized": true,
253
  "rstrip": false,
254
+ "single_word": false
 
255
  },
256
+ {
257
  "content": "<extra_id_63>",
258
  "lstrip": true,
259
  "normalized": true,
260
  "rstrip": false,
261
+ "single_word": false
 
262
  },
263
+ {
264
  "content": "<extra_id_62>",
265
  "lstrip": true,
266
  "normalized": true,
267
  "rstrip": false,
268
+ "single_word": false
 
269
  },
270
+ {
271
  "content": "<extra_id_61>",
272
  "lstrip": true,
273
  "normalized": true,
274
  "rstrip": false,
275
+ "single_word": false
 
276
  },
277
+ {
278
  "content": "<extra_id_60>",
279
  "lstrip": true,
280
  "normalized": true,
281
  "rstrip": false,
282
+ "single_word": false
 
283
  },
284
+ {
285
  "content": "<extra_id_59>",
286
  "lstrip": true,
287
  "normalized": true,
288
  "rstrip": false,
289
+ "single_word": false
 
290
  },
291
+ {
292
  "content": "<extra_id_58>",
293
  "lstrip": true,
294
  "normalized": true,
295
  "rstrip": false,
296
+ "single_word": false
 
297
  },
298
+ {
299
  "content": "<extra_id_57>",
300
  "lstrip": true,
301
  "normalized": true,
302
  "rstrip": false,
303
+ "single_word": false
 
304
  },
305
+ {
306
  "content": "<extra_id_56>",
307
  "lstrip": true,
308
  "normalized": true,
309
  "rstrip": false,
310
+ "single_word": false
 
311
  },
312
+ {
313
  "content": "<extra_id_55>",
314
  "lstrip": true,
315
  "normalized": true,
316
  "rstrip": false,
317
+ "single_word": false
 
318
  },
319
+ {
320
  "content": "<extra_id_54>",
321
  "lstrip": true,
322
  "normalized": true,
323
  "rstrip": false,
324
+ "single_word": false
 
325
  },
326
+ {
327
  "content": "<extra_id_53>",
328
  "lstrip": true,
329
  "normalized": true,
330
  "rstrip": false,
331
+ "single_word": false
 
332
  },
333
+ {
334
  "content": "<extra_id_52>",
335
  "lstrip": true,
336
  "normalized": true,
337
  "rstrip": false,
338
+ "single_word": false
 
339
  },
340
+ {
341
  "content": "<extra_id_51>",
342
  "lstrip": true,
343
  "normalized": true,
344
  "rstrip": false,
345
+ "single_word": false
 
346
  },
347
+ {
348
  "content": "<extra_id_50>",
349
  "lstrip": true,
350
  "normalized": true,
351
  "rstrip": false,
352
+ "single_word": false
 
353
  },
354
+ {
355
  "content": "<extra_id_49>",
356
  "lstrip": true,
357
  "normalized": true,
358
  "rstrip": false,
359
+ "single_word": false
 
360
  },
361
+ {
362
  "content": "<extra_id_48>",
363
  "lstrip": true,
364
  "normalized": true,
365
  "rstrip": false,
366
+ "single_word": false
 
367
  },
368
+ {
369
  "content": "<extra_id_47>",
370
  "lstrip": true,
371
  "normalized": true,
372
  "rstrip": false,
373
+ "single_word": false
 
374
  },
375
+ {
376
  "content": "<extra_id_46>",
377
  "lstrip": true,
378
  "normalized": true,
379
  "rstrip": false,
380
+ "single_word": false
 
381
  },
382
+ {
383
  "content": "<extra_id_45>",
384
  "lstrip": true,
385
  "normalized": true,
386
  "rstrip": false,
387
+ "single_word": false
 
388
  },
389
+ {
390
  "content": "<extra_id_44>",
391
  "lstrip": true,
392
  "normalized": true,
393
  "rstrip": false,
394
+ "single_word": false
 
395
  },
396
+ {
397
  "content": "<extra_id_43>",
398
  "lstrip": true,
399
  "normalized": true,
400
  "rstrip": false,
401
+ "single_word": false
 
402
  },
403
+ {
404
  "content": "<extra_id_42>",
405
  "lstrip": true,
406
  "normalized": true,
407
  "rstrip": false,
408
+ "single_word": false
 
409
  },
410
+ {
411
  "content": "<extra_id_41>",
412
  "lstrip": true,
413
  "normalized": true,
414
  "rstrip": false,
415
+ "single_word": false
 
416
  },
417
+ {
418
  "content": "<extra_id_40>",
419
  "lstrip": true,
420
  "normalized": true,
421
  "rstrip": false,
422
+ "single_word": false
 
423
  },
424
+ {
425
  "content": "<extra_id_39>",
426
  "lstrip": true,
427
  "normalized": true,
428
  "rstrip": false,
429
+ "single_word": false
 
430
  },
431
+ {
432
  "content": "<extra_id_38>",
433
  "lstrip": true,
434
  "normalized": true,
435
  "rstrip": false,
436
+ "single_word": false
 
437
  },
438
+ {
439
  "content": "<extra_id_37>",
440
  "lstrip": true,
441
  "normalized": true,
442
  "rstrip": false,
443
+ "single_word": false
 
444
  },
445
+ {
446
  "content": "<extra_id_36>",
447
  "lstrip": true,
448
  "normalized": true,
449
  "rstrip": false,
450
+ "single_word": false
 
451
  },
452
+ {
453
  "content": "<extra_id_35>",
454
  "lstrip": true,
455
  "normalized": true,
456
  "rstrip": false,
457
+ "single_word": false
 
458
  },
459
+ {
460
  "content": "<extra_id_34>",
461
  "lstrip": true,
462
  "normalized": true,
463
  "rstrip": false,
464
+ "single_word": false
 
465
  },
466
+ {
467
  "content": "<extra_id_33>",
468
  "lstrip": true,
469
  "normalized": true,
470
  "rstrip": false,
471
+ "single_word": false
 
472
  },
473
+ {
474
  "content": "<extra_id_32>",
475
  "lstrip": true,
476
  "normalized": true,
477
  "rstrip": false,
478
+ "single_word": false
 
479
  },
480
+ {
481
  "content": "<extra_id_31>",
482
  "lstrip": true,
483
  "normalized": true,
484
  "rstrip": false,
485
+ "single_word": false
 
486
  },
487
+ {
488
  "content": "<extra_id_30>",
489
  "lstrip": true,
490
  "normalized": true,
491
  "rstrip": false,
492
+ "single_word": false
 
493
  },
494
+ {
495
  "content": "<extra_id_29>",
496
  "lstrip": true,
497
  "normalized": true,
498
  "rstrip": false,
499
+ "single_word": false
 
500
  },
501
+ {
502
  "content": "<extra_id_28>",
503
  "lstrip": true,
504
  "normalized": true,
505
  "rstrip": false,
506
+ "single_word": false
 
507
  },
508
+ {
509
  "content": "<extra_id_27>",
510
  "lstrip": true,
511
  "normalized": true,
512
  "rstrip": false,
513
+ "single_word": false
 
514
  },
515
+ {
516
  "content": "<extra_id_26>",
517
  "lstrip": true,
518
  "normalized": true,
519
  "rstrip": false,
520
+ "single_word": false
 
521
  },
522
+ {
523
  "content": "<extra_id_25>",
524
  "lstrip": true,
525
  "normalized": true,
526
  "rstrip": false,
527
+ "single_word": false
 
528
  },
529
+ {
530
  "content": "<extra_id_24>",
531
  "lstrip": true,
532
  "normalized": true,
533
  "rstrip": false,
534
+ "single_word": false
 
535
  },
536
+ {
537
  "content": "<extra_id_23>",
538
  "lstrip": true,
539
  "normalized": true,
540
  "rstrip": false,
541
+ "single_word": false
 
542
  },
543
+ {
544
  "content": "<extra_id_22>",
545
  "lstrip": true,
546
  "normalized": true,
547
  "rstrip": false,
548
+ "single_word": false
 
549
  },
550
+ {
551
  "content": "<extra_id_21>",
552
  "lstrip": true,
553
  "normalized": true,
554
  "rstrip": false,
555
+ "single_word": false
 
556
  },
557
+ {
558
  "content": "<extra_id_20>",
559
  "lstrip": true,
560
  "normalized": true,
561
  "rstrip": false,
562
+ "single_word": false
 
563
  },
564
+ {
565
  "content": "<extra_id_19>",
566
  "lstrip": true,
567
  "normalized": true,
568
  "rstrip": false,
569
+ "single_word": false
 
570
  },
571
+ {
572
  "content": "<extra_id_18>",
573
  "lstrip": true,
574
  "normalized": true,
575
  "rstrip": false,
576
+ "single_word": false
 
577
  },
578
+ {
579
  "content": "<extra_id_17>",
580
  "lstrip": true,
581
  "normalized": true,
582
  "rstrip": false,
583
+ "single_word": false
 
584
  },
585
+ {
586
  "content": "<extra_id_16>",
587
  "lstrip": true,
588
  "normalized": true,
589
  "rstrip": false,
590
+ "single_word": false
 
591
  },
592
+ {
593
  "content": "<extra_id_15>",
594
  "lstrip": true,
595
  "normalized": true,
596
  "rstrip": false,
597
+ "single_word": false
 
598
  },
599
+ {
600
  "content": "<extra_id_14>",
601
  "lstrip": true,
602
  "normalized": true,
603
  "rstrip": false,
604
+ "single_word": false
 
605
  },
606
+ {
607
  "content": "<extra_id_13>",
608
  "lstrip": true,
609
  "normalized": true,
610
  "rstrip": false,
611
+ "single_word": false
 
612
  },
613
+ {
614
  "content": "<extra_id_12>",
615
  "lstrip": true,
616
  "normalized": true,
617
  "rstrip": false,
618
+ "single_word": false
 
619
  },
620
+ {
621
  "content": "<extra_id_11>",
622
  "lstrip": true,
623
  "normalized": true,
624
  "rstrip": false,
625
+ "single_word": false
 
626
  },
627
+ {
628
  "content": "<extra_id_10>",
629
  "lstrip": true,
630
  "normalized": true,
631
  "rstrip": false,
632
+ "single_word": false
 
633
  },
634
+ {
635
  "content": "<extra_id_9>",
636
  "lstrip": true,
637
  "normalized": true,
638
  "rstrip": false,
639
+ "single_word": false
 
640
  },
641
+ {
642
  "content": "<extra_id_8>",
643
  "lstrip": true,
644
  "normalized": true,
645
  "rstrip": false,
646
+ "single_word": false
 
647
  },
648
+ {
649
  "content": "<extra_id_7>",
650
  "lstrip": true,
651
  "normalized": true,
652
  "rstrip": false,
653
+ "single_word": false
 
654
  },
655
+ {
656
  "content": "<extra_id_6>",
657
  "lstrip": true,
658
  "normalized": true,
659
  "rstrip": false,
660
+ "single_word": false
 
661
  },
662
+ {
663
  "content": "<extra_id_5>",
664
  "lstrip": true,
665
  "normalized": true,
666
  "rstrip": false,
667
+ "single_word": false
 
668
  },
669
+ {
670
  "content": "<extra_id_4>",
671
  "lstrip": true,
672
  "normalized": true,
673
  "rstrip": false,
674
+ "single_word": false
 
675
  },
676
+ {
677
  "content": "<extra_id_3>",
678
  "lstrip": true,
679
  "normalized": true,
680
  "rstrip": false,
681
+ "single_word": false
 
682
  },
683
+ {
684
  "content": "<extra_id_2>",
685
  "lstrip": true,
686
  "normalized": true,
687
  "rstrip": false,
688
+ "single_word": false
 
689
  },
690
+ {
691
  "content": "<extra_id_1>",
692
  "lstrip": true,
693
  "normalized": true,
694
  "rstrip": false,
695
+ "single_word": false
 
696
  },
697
+ {
698
  "content": "<extra_id_0>",
699
  "lstrip": true,
700
  "normalized": true,
701
  "rstrip": false,
702
+ "single_word": false
 
703
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
704
  ],
705
+ "backend": "tokenizers",
706
  "bos_token": "<s>",
 
707
  "cls_token": "<s>",
708
  "eos_token": "</s>",
709
  "errors": "replace",
710
+ "extra_special_tokens": [],
711
+ "is_local": false,
712
  "mask_token": "<mask>",
713
  "model_max_length": 512,
714
  "pad_token": "<pad>",