Training in progress, step 160
Browse files- adapter_config.json +2 -2
- adapter_model.safetensors +1 -1
- dynamic_sampling_log.txt +149 -0
- tokenizer.json +2 -2
- training_args.bin +1 -1
adapter_config.json
CHANGED
|
@@ -30,11 +30,11 @@
|
|
| 30 |
"revision": null,
|
| 31 |
"target_modules": [
|
| 32 |
"k_proj",
|
|
|
|
|
|
|
| 33 |
"down_proj",
|
| 34 |
"gate_proj",
|
| 35 |
-
"q_proj",
|
| 36 |
"up_proj",
|
| 37 |
-
"v_proj",
|
| 38 |
"o_proj"
|
| 39 |
],
|
| 40 |
"target_parameters": null,
|
|
|
|
| 30 |
"revision": null,
|
| 31 |
"target_modules": [
|
| 32 |
"k_proj",
|
| 33 |
+
"q_proj",
|
| 34 |
+
"v_proj",
|
| 35 |
"down_proj",
|
| 36 |
"gate_proj",
|
|
|
|
| 37 |
"up_proj",
|
|
|
|
| 38 |
"o_proj"
|
| 39 |
],
|
| 40 |
"target_parameters": null,
|
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 335605144
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2b451663b0f74fae0d53a36528ab760d2b65a192a718f32817b524332befa494
|
| 3 |
size 335605144
|
dynamic_sampling_log.txt
CHANGED
|
@@ -1214,3 +1214,152 @@ Step Attempts Total Prompts Valid Prompts Efficiency
|
|
| 1214 |
149 3 18 6 33.3 %
|
| 1215 |
149 3 18 6 33.3 %
|
| 1216 |
149 4 24 6 25.0 %
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1214 |
149 3 18 6 33.3 %
|
| 1215 |
149 3 18 6 33.3 %
|
| 1216 |
149 4 24 6 25.0 %
|
| 1217 |
+
150 6 36 6 16.7 %
|
| 1218 |
+
150 5 30 6 20.0 %
|
| 1219 |
+
150 5 30 6 20.0 %
|
| 1220 |
+
150 5 30 6 20.0 %
|
| 1221 |
+
150 6 36 6 16.7 %
|
| 1222 |
+
150 2 12 6 50.0 %
|
| 1223 |
+
150 3 18 6 33.3 %
|
| 1224 |
+
150 1 6 6 100.0 %
|
| 1225 |
+
151 2 12 6 50.0 %
|
| 1226 |
+
151 3 18 6 33.3 %
|
| 1227 |
+
151 2 12 6 50.0 %
|
| 1228 |
+
151 3 18 6 33.3 %
|
| 1229 |
+
151 1 6 6 100.0 %
|
| 1230 |
+
151 3 18 6 33.3 %
|
| 1231 |
+
151 3 18 6 33.3 %
|
| 1232 |
+
151 5 30 6 20.0 %
|
| 1233 |
+
152 2 12 6 50.0 %
|
| 1234 |
+
152 1 6 6 100.0 %
|
| 1235 |
+
152 1 6 6 100.0 %
|
| 1236 |
+
152 3 18 6 33.3 %
|
| 1237 |
+
152 2 12 6 50.0 %
|
| 1238 |
+
152 2 12 6 50.0 %
|
| 1239 |
+
152 4 24 6 25.0 %
|
| 1240 |
+
152 2 12 6 50.0 %
|
| 1241 |
+
153 4 24 6 25.0 %
|
| 1242 |
+
153 1 6 6 100.0 %
|
| 1243 |
+
153 2 12 6 50.0 %
|
| 1244 |
+
153 4 24 6 25.0 %
|
| 1245 |
+
153 9 54 6 11.1 %
|
| 1246 |
+
153 2 12 6 50.0 %
|
| 1247 |
+
153 1 6 6 100.0 %
|
| 1248 |
+
153 8 48 6 12.5 %
|
| 1249 |
+
154 6 36 6 16.7 %
|
| 1250 |
+
154 4 24 6 25.0 %
|
| 1251 |
+
154 1 6 6 100.0 %
|
| 1252 |
+
154 6 36 6 16.7 %
|
| 1253 |
+
154 2 12 6 50.0 %
|
| 1254 |
+
154 3 18 6 33.3 %
|
| 1255 |
+
154 4 24 6 25.0 %
|
| 1256 |
+
154 2 12 6 50.0 %
|
| 1257 |
+
155 7 42 6 14.3 %
|
| 1258 |
+
155 2 12 6 50.0 %
|
| 1259 |
+
155 3 18 6 33.3 %
|
| 1260 |
+
155 2 12 6 50.0 %
|
| 1261 |
+
155 2 12 6 50.0 %
|
| 1262 |
+
155 3 18 6 33.3 %
|
| 1263 |
+
155 13 78 6 7.7 %
|
| 1264 |
+
155 2 12 6 50.0 %
|
| 1265 |
+
156 2 12 6 50.0 %
|
| 1266 |
+
156 4 24 6 25.0 %
|
| 1267 |
+
156 3 18 6 33.3 %
|
| 1268 |
+
156 3 18 6 33.3 %
|
| 1269 |
+
156 3 18 6 33.3 %
|
| 1270 |
+
156 5 30 6 20.0 %
|
| 1271 |
+
156 2 12 6 50.0 %
|
| 1272 |
+
156 2 12 6 50.0 %
|
| 1273 |
+
157 3 18 6 33.3 %
|
| 1274 |
+
157 5 30 6 20.0 %
|
| 1275 |
+
157 7 42 6 14.3 %
|
| 1276 |
+
157 5 30 6 20.0 %
|
| 1277 |
+
157 6 36 6 16.7 %
|
| 1278 |
+
157 4 24 6 25.0 %
|
| 1279 |
+
157 2 12 6 50.0 %
|
| 1280 |
+
157 3 18 6 33.3 %
|
| 1281 |
+
158 9 54 6 11.1 %
|
| 1282 |
+
158 2 12 6 50.0 %
|
| 1283 |
+
158 2 12 6 50.0 %
|
| 1284 |
+
158 4 24 6 25.0 %
|
| 1285 |
+
158 3 18 6 33.3 %
|
| 1286 |
+
150 2 12 6 50.0 %
|
| 1287 |
+
150 6 36 6 16.7 %
|
| 1288 |
+
150 4 24 6 25.0 %
|
| 1289 |
+
150 7 42 6 14.3 %
|
| 1290 |
+
150 3 18 6 33.3 %
|
| 1291 |
+
150 3 18 6 33.3 %
|
| 1292 |
+
150 1 6 6 100.0 %
|
| 1293 |
+
150 2 12 6 50.0 %
|
| 1294 |
+
151 2 12 6 50.0 %
|
| 1295 |
+
151 3 18 6 33.3 %
|
| 1296 |
+
151 4 24 6 25.0 %
|
| 1297 |
+
151 1 6 6 100.0 %
|
| 1298 |
+
151 8 48 6 12.5 %
|
| 1299 |
+
151 2 12 6 50.0 %
|
| 1300 |
+
151 3 18 6 33.3 %
|
| 1301 |
+
151 9 54 6 11.1 %
|
| 1302 |
+
152 4 24 6 25.0 %
|
| 1303 |
+
152 2 12 6 50.0 %
|
| 1304 |
+
152 8 48 6 12.5 %
|
| 1305 |
+
152 3 18 6 33.3 %
|
| 1306 |
+
152 2 12 6 50.0 %
|
| 1307 |
+
152 3 18 6 33.3 %
|
| 1308 |
+
152 2 12 6 50.0 %
|
| 1309 |
+
152 3 18 6 33.3 %
|
| 1310 |
+
153 6 36 6 16.7 %
|
| 1311 |
+
153 4 24 6 25.0 %
|
| 1312 |
+
153 5 30 6 20.0 %
|
| 1313 |
+
153 3 18 6 33.3 %
|
| 1314 |
+
153 3 18 6 33.3 %
|
| 1315 |
+
153 4 24 6 25.0 %
|
| 1316 |
+
153 4 24 6 25.0 %
|
| 1317 |
+
153 1 6 6 100.0 %
|
| 1318 |
+
154 6 36 6 16.7 %
|
| 1319 |
+
154 3 18 6 33.3 %
|
| 1320 |
+
154 2 12 6 50.0 %
|
| 1321 |
+
154 1 6 6 100.0 %
|
| 1322 |
+
154 2 12 6 50.0 %
|
| 1323 |
+
154 5 30 6 20.0 %
|
| 1324 |
+
154 2 12 6 50.0 %
|
| 1325 |
+
154 2 12 6 50.0 %
|
| 1326 |
+
155 3 18 6 33.3 %
|
| 1327 |
+
155 4 24 6 25.0 %
|
| 1328 |
+
155 10 60 6 10.0 %
|
| 1329 |
+
155 8 48 6 12.5 %
|
| 1330 |
+
155 5 30 6 20.0 %
|
| 1331 |
+
155 3 18 6 33.3 %
|
| 1332 |
+
155 8 48 6 12.5 %
|
| 1333 |
+
155 6 36 6 16.7 %
|
| 1334 |
+
156 3 18 6 33.3 %
|
| 1335 |
+
156 3 18 6 33.3 %
|
| 1336 |
+
156 6 36 6 16.7 %
|
| 1337 |
+
156 3 18 6 33.3 %
|
| 1338 |
+
156 1 6 6 100.0 %
|
| 1339 |
+
156 3 18 6 33.3 %
|
| 1340 |
+
156 1 6 6 100.0 %
|
| 1341 |
+
156 4 24 6 25.0 %
|
| 1342 |
+
157 5 30 6 20.0 %
|
| 1343 |
+
157 3 18 6 33.3 %
|
| 1344 |
+
157 4 24 6 25.0 %
|
| 1345 |
+
157 9 54 6 11.1 %
|
| 1346 |
+
157 4 24 6 25.0 %
|
| 1347 |
+
157 4 24 6 25.0 %
|
| 1348 |
+
157 6 36 6 16.7 %
|
| 1349 |
+
157 3 18 6 33.3 %
|
| 1350 |
+
158 3 18 6 33.3 %
|
| 1351 |
+
158 2 12 6 50.0 %
|
| 1352 |
+
158 5 30 6 20.0 %
|
| 1353 |
+
158 4 24 6 25.0 %
|
| 1354 |
+
158 4 24 6 25.0 %
|
| 1355 |
+
158 11 66 6 9.1 %
|
| 1356 |
+
158 5 30 6 20.0 %
|
| 1357 |
+
158 3 18 6 33.3 %
|
| 1358 |
+
159 8 48 6 12.5 %
|
| 1359 |
+
159 6 36 6 16.7 %
|
| 1360 |
+
159 6 36 6 16.7 %
|
| 1361 |
+
159 2 12 6 50.0 %
|
| 1362 |
+
159 8 48 6 12.5 %
|
| 1363 |
+
159 4 24 6 25.0 %
|
| 1364 |
+
159 4 24 6 25.0 %
|
| 1365 |
+
159 4 24 6 25.0 %
|
tokenizer.json
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:26c881aaf4ef935b1516ec79ad6405dd2a459f2b5d431a8a4a1399c92f3ba022
|
| 3 |
+
size 17209711
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 8760
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f226307e55b90254d38ea4c353a35911a575a170c592310101fe03a927c9dc78
|
| 3 |
size 8760
|