littlEndian committed on
Commit
c39f060
·
verified ·
1 Parent(s): e678b0b

Training in progress, step 240

Browse files
Files changed (4) hide show
  1. config.json +2 -2
  2. model.safetensors +2 -2
  3. tokenizer.json +47 -52
  4. training_args.bin +1 -1
config.json CHANGED
@@ -40,7 +40,7 @@
40
  "tie_word_embeddings": true,
41
  "type_vocab_size": 2,
42
  "use_cache": true,
43
- "vocab_size": 52
44
  },
45
  "decoder_start_token_id": 2,
46
  "dtype": "float32",
@@ -82,7 +82,7 @@
82
  "tie_word_embeddings": true,
83
  "type_vocab_size": 2,
84
  "use_cache": true,
85
- "vocab_size": 52
86
  },
87
  "eos_token_id": 0,
88
  "is_encoder_decoder": true,
 
40
  "tie_word_embeddings": true,
41
  "type_vocab_size": 2,
42
  "use_cache": true,
43
+ "vocab_size": 51
44
  },
45
  "decoder_start_token_id": 2,
46
  "dtype": "float32",
 
82
  "tie_word_embeddings": true,
83
  "type_vocab_size": 2,
84
  "use_cache": true,
85
+ "vocab_size": 51
86
  },
87
  "eos_token_id": 0,
88
  "is_encoder_decoder": true,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a536ec39ae7b8ced1396dd7d9a8a743afa77b2769e5d572b9815da9315edb6b2
3
- size 31205552
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3482f92f4e87979e787d5f81c47fe290ef187ce2c6a4b12483ca7185c902425f
3
+ size 31203500
tokenizer.json CHANGED
@@ -113,76 +113,75 @@
113
  "7": 13,
114
  "8": 14,
115
  "9": 15,
116
- "10": 16,
117
- "99": 17,
118
- "98": 18,
119
- "11": 19,
120
- "12": 20,
121
- "97": 21,
122
- "96": 22,
123
- "13": 23,
124
  "14": 24,
125
  "95": 25,
126
  "15": 26,
127
  "94": 27,
128
- "16": 28,
129
- "93": 29,
130
  "92": 30,
131
  "17": 31,
132
- "91": 32,
133
- "18": 33,
134
- "19": 34,
135
- "90": 35,
136
  "20": 36,
137
  "89": 37,
138
- "88": 38,
139
- "21": 39,
140
  "22": 40,
141
  "87": 41,
142
- "86": 42,
143
- "23": 43,
144
  "24": 44,
145
  "85": 45,
146
  "25": 46,
147
  "84": 47,
148
  "26": 48,
149
  "83": 49,
150
- "27": 50,
151
- "82": 51
152
  },
153
  "merges": [
154
- [
155
- "1",
156
- "0"
157
- ],
158
  [
159
  "9",
160
  "9"
161
  ],
162
  [
163
- "9",
164
- "8"
165
  ],
166
  [
167
  "1",
168
  "1"
169
  ],
170
  [
171
- "1",
172
- "2"
173
  ],
174
  [
175
  "9",
176
  "7"
177
  ],
178
  [
179
- "9",
180
- "6"
181
  ],
182
  [
183
  "1",
184
  "3"
185
  ],
 
 
 
 
186
  [
187
  "1",
188
  "4"
@@ -199,14 +198,14 @@
199
  "9",
200
  "4"
201
  ],
202
- [
203
- "1",
204
- "6"
205
- ],
206
  [
207
  "9",
208
  "3"
209
  ],
 
 
 
 
210
  [
211
  "9",
212
  "2"
@@ -215,22 +214,22 @@
215
  "1",
216
  "7"
217
  ],
218
- [
219
- "9",
220
- "1"
221
- ],
222
  [
223
  "1",
224
  "8"
225
  ],
226
  [
227
- "1",
228
- "9"
229
  ],
230
  [
231
  "9",
232
  "0"
233
  ],
 
 
 
 
234
  [
235
  "2",
236
  "0"
@@ -239,14 +238,14 @@
239
  "8",
240
  "9"
241
  ],
242
- [
243
- "8",
244
- "8"
245
- ],
246
  [
247
  "2",
248
  "1"
249
  ],
 
 
 
 
250
  [
251
  "2",
252
  "2"
@@ -255,14 +254,14 @@
255
  "8",
256
  "7"
257
  ],
258
- [
259
- "8",
260
- "6"
261
- ],
262
  [
263
  "2",
264
  "3"
265
  ],
 
 
 
 
266
  [
267
  "2",
268
  "4"
@@ -287,10 +286,6 @@
287
  "8",
288
  "3"
289
  ],
290
- [
291
- "2",
292
- "7"
293
- ],
294
  [
295
  "8",
296
  "2"
 
113
  "7": 13,
114
  "8": 14,
115
  "9": 15,
116
+ "99": 16,
117
+ "10": 17,
118
+ "11": 18,
119
+ "98": 19,
120
+ "97": 20,
121
+ "12": 21,
122
+ "13": 22,
123
+ "96": 23,
124
  "14": 24,
125
  "95": 25,
126
  "15": 26,
127
  "94": 27,
128
+ "93": 28,
129
+ "16": 29,
130
  "92": 30,
131
  "17": 31,
132
+ "18": 32,
133
+ "91": 33,
134
+ "90": 34,
135
+ "19": 35,
136
  "20": 36,
137
  "89": 37,
138
+ "21": 38,
139
+ "88": 39,
140
  "22": 40,
141
  "87": 41,
142
+ "23": 42,
143
+ "86": 43,
144
  "24": 44,
145
  "85": 45,
146
  "25": 46,
147
  "84": 47,
148
  "26": 48,
149
  "83": 49,
150
+ "82": 50
 
151
  },
152
  "merges": [
 
 
 
 
153
  [
154
  "9",
155
  "9"
156
  ],
157
  [
158
+ "1",
159
+ "0"
160
  ],
161
  [
162
  "1",
163
  "1"
164
  ],
165
  [
166
+ "9",
167
+ "8"
168
  ],
169
  [
170
  "9",
171
  "7"
172
  ],
173
  [
174
+ "1",
175
+ "2"
176
  ],
177
  [
178
  "1",
179
  "3"
180
  ],
181
+ [
182
+ "9",
183
+ "6"
184
+ ],
185
  [
186
  "1",
187
  "4"
 
198
  "9",
199
  "4"
200
  ],
 
 
 
 
201
  [
202
  "9",
203
  "3"
204
  ],
205
+ [
206
+ "1",
207
+ "6"
208
+ ],
209
  [
210
  "9",
211
  "2"
 
214
  "1",
215
  "7"
216
  ],
 
 
 
 
217
  [
218
  "1",
219
  "8"
220
  ],
221
  [
222
+ "9",
223
+ "1"
224
  ],
225
  [
226
  "9",
227
  "0"
228
  ],
229
+ [
230
+ "1",
231
+ "9"
232
+ ],
233
  [
234
  "2",
235
  "0"
 
238
  "8",
239
  "9"
240
  ],
 
 
 
 
241
  [
242
  "2",
243
  "1"
244
  ],
245
+ [
246
+ "8",
247
+ "8"
248
+ ],
249
  [
250
  "2",
251
  "2"
 
254
  "8",
255
  "7"
256
  ],
 
 
 
 
257
  [
258
  "2",
259
  "3"
260
  ],
261
+ [
262
+ "8",
263
+ "6"
264
+ ],
265
  [
266
  "2",
267
  "4"
 
286
  "8",
287
  "3"
288
  ],
 
 
 
 
289
  [
290
  "8",
291
  "2"
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:357fa22415545d879a2d6b79d0baa4f85c4d2ec87f02cebe8c9c5a5d6cc27f49
3
  size 5329
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ed73efd6078c7c5ea42244aee3fe3bf407cb8727dce914f606e81ba4b21b03a
3
  size 5329