jszot committed on
Commit
9ac39bd
·
verified ·
1 Parent(s): c1cbf0a

Training in progress, step 420

Browse files
Files changed (4) hide show
  1. config.json +2 -2
  2. model.safetensors +2 -2
  3. tokenizer.json +51 -55
  4. tokenizer_config.json +0 -1
config.json CHANGED
@@ -10,7 +10,7 @@
10
  "bos_token_id": null,
11
  "chunk_size_feed_forward": 0,
12
  "classifier_dropout": null,
13
- "dtype": "float32",
14
  "eos_token_id": null,
15
  "hidden_act": "gelu",
16
  "hidden_dropout_prob": 0.1,
@@ -52,7 +52,7 @@
52
  "bos_token_id": null,
53
  "chunk_size_feed_forward": 0,
54
  "classifier_dropout": null,
55
- "dtype": "float32",
56
  "eos_token_id": null,
57
  "hidden_act": "gelu",
58
  "hidden_dropout_prob": 0.1,
 
10
  "bos_token_id": null,
11
  "chunk_size_feed_forward": 0,
12
  "classifier_dropout": null,
13
+ "dtype": null,
14
  "eos_token_id": null,
15
  "hidden_act": "gelu",
16
  "hidden_dropout_prob": 0.1,
 
52
  "bos_token_id": null,
53
  "chunk_size_feed_forward": 0,
54
  "classifier_dropout": null,
55
+ "dtype": null,
56
  "eos_token_id": null,
57
  "hidden_act": "gelu",
58
  "hidden_dropout_prob": 0.1,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:38325a3f208b67a3b7d8b9c5b6f67317c0ea6e112eeb991707a152812f865e46
3
- size 31205528
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e7346b4664d9f395023b6f04809b578d70106d9ba2b351dcdb92d850027e0d2
3
+ size 31205552
tokenizer.json CHANGED
@@ -113,55 +113,51 @@
113
  "7": 13,
114
  "8": 14,
115
  "9": 15,
116
- "10": 16,
117
  "99": 17,
118
- "98": 18,
119
  "11": 19,
120
- "97": 20,
121
  "12": 21,
122
- "96": 22,
123
  "13": 23,
124
- "95": 24,
125
- "14": 25,
126
- "15": 26,
127
  "94": 27,
128
- "93": 28,
129
  "16": 29,
130
- "17": 30,
131
- "92": 31,
132
- "18": 32,
133
- "91": 33,
134
- "90": 34,
135
  "19": 35,
136
- "20": 36,
137
  "89": 37,
138
- "21": 38,
139
- "88": 39,
140
- "87": 40,
141
  "22": 41,
142
- "23": 42,
143
  "86": 43,
144
- "85": 44,
145
- "24": 45,
146
- "25": 46,
147
- "84": 47,
148
- "83": 48,
149
  "26": 49,
150
- "27": 50,
151
  "82": 51
152
  },
153
  "merges": [
154
- [
155
- "1",
156
- "0"
157
- ],
158
  [
159
  "9",
160
  "9"
161
  ],
162
  [
163
- "9",
164
- "8"
165
  ],
166
  [
167
  "1",
@@ -169,7 +165,7 @@
169
  ],
170
  [
171
  "9",
172
- "7"
173
  ],
174
  [
175
  "1",
@@ -177,7 +173,7 @@
177
  ],
178
  [
179
  "9",
180
- "6"
181
  ],
182
  [
183
  "1",
@@ -185,28 +181,32 @@
185
  ],
186
  [
187
  "9",
188
- "5"
189
  ],
190
  [
191
- "1",
192
- "4"
193
  ],
194
  [
195
  "1",
196
- "5"
197
  ],
198
  [
199
  "9",
200
  "4"
201
  ],
202
  [
203
- "9",
204
- "3"
205
  ],
206
  [
207
  "1",
208
  "6"
209
  ],
 
 
 
 
210
  [
211
  "1",
212
  "7"
@@ -223,16 +223,12 @@
223
  "9",
224
  "1"
225
  ],
226
- [
227
- "9",
228
- "0"
229
- ],
230
  [
231
  "1",
232
  "9"
233
  ],
234
  [
235
- "2",
236
  "0"
237
  ],
238
  [
@@ -241,28 +237,32 @@
241
  ],
242
  [
243
  "2",
244
- "1"
245
  ],
246
  [
247
- "8",
248
- "8"
249
  ],
250
  [
251
  "8",
252
- "7"
253
  ],
254
  [
255
  "2",
256
  "2"
257
  ],
258
  [
259
- "2",
260
- "3"
261
  ],
262
  [
263
  "8",
264
  "6"
265
  ],
 
 
 
 
266
  [
267
  "8",
268
  "5"
@@ -279,17 +279,13 @@
279
  "8",
280
  "4"
281
  ],
282
- [
283
- "8",
284
- "3"
285
- ],
286
  [
287
  "2",
288
  "6"
289
  ],
290
  [
291
- "2",
292
- "7"
293
  ],
294
  [
295
  "8",
 
113
  "7": 13,
114
  "8": 14,
115
  "9": 15,
116
+ "=": 16,
117
  "99": 17,
118
+ "10": 18,
119
  "11": 19,
120
+ "98": 20,
121
  "12": 21,
122
+ "97": 22,
123
  "13": 23,
124
+ "96": 24,
125
+ "95": 25,
126
+ "14": 26,
127
  "94": 27,
128
+ "15": 28,
129
  "16": 29,
130
+ "93": 30,
131
+ "17": 31,
132
+ "92": 32,
133
+ "18": 33,
134
+ "91": 34,
135
  "19": 35,
136
+ "90": 36,
137
  "89": 37,
138
+ "20": 38,
139
+ "21": 39,
140
+ "88": 40,
141
  "22": 41,
142
+ "87": 42,
143
  "86": 43,
144
+ "23": 44,
145
+ "85": 45,
146
+ "24": 46,
147
+ "25": 47,
148
+ "84": 48,
149
  "26": 49,
150
+ "83": 50,
151
  "82": 51
152
  },
153
  "merges": [
 
 
 
 
154
  [
155
  "9",
156
  "9"
157
  ],
158
  [
159
+ "1",
160
+ "0"
161
  ],
162
  [
163
  "1",
 
165
  ],
166
  [
167
  "9",
168
+ "8"
169
  ],
170
  [
171
  "1",
 
173
  ],
174
  [
175
  "9",
176
+ "7"
177
  ],
178
  [
179
  "1",
 
181
  ],
182
  [
183
  "9",
184
+ "6"
185
  ],
186
  [
187
+ "9",
188
+ "5"
189
  ],
190
  [
191
  "1",
192
+ "4"
193
  ],
194
  [
195
  "9",
196
  "4"
197
  ],
198
  [
199
+ "1",
200
+ "5"
201
  ],
202
  [
203
  "1",
204
  "6"
205
  ],
206
+ [
207
+ "9",
208
+ "3"
209
+ ],
210
  [
211
  "1",
212
  "7"
 
223
  "9",
224
  "1"
225
  ],
 
 
 
 
226
  [
227
  "1",
228
  "9"
229
  ],
230
  [
231
+ "9",
232
  "0"
233
  ],
234
  [
 
237
  ],
238
  [
239
  "2",
240
+ "0"
241
  ],
242
  [
243
+ "2",
244
+ "1"
245
  ],
246
  [
247
  "8",
248
+ "8"
249
  ],
250
  [
251
  "2",
252
  "2"
253
  ],
254
  [
255
+ "8",
256
+ "7"
257
  ],
258
  [
259
  "8",
260
  "6"
261
  ],
262
+ [
263
+ "2",
264
+ "3"
265
+ ],
266
  [
267
  "8",
268
  "5"
 
279
  "8",
280
  "4"
281
  ],
 
 
 
 
282
  [
283
  "2",
284
  "6"
285
  ],
286
  [
287
+ "8",
288
+ "3"
289
  ],
290
  [
291
  "8",
tokenizer_config.json CHANGED
@@ -2,7 +2,6 @@
2
  "backend": "tokenizers",
3
  "cls_token": "[CLS]",
4
  "eos_token": "[EOS]",
5
- "is_local": false,
6
  "model_max_length": 1000000000000000019884624838656,
7
  "pad_token": "[PAD]",
8
  "tokenizer_class": "TokenizersBackend"
 
2
  "backend": "tokenizers",
3
  "cls_token": "[CLS]",
4
  "eos_token": "[EOS]",
 
5
  "model_max_length": 1000000000000000019884624838656,
6
  "pad_token": "[PAD]",
7
  "tokenizer_class": "TokenizersBackend"