Training in progress, step 500
Browse files- adapter_model.safetensors +1 -1
- debug.log +231 -0
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 6299896
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:872b413f45fca6c7860fa38c56a0e3fdec442e01d7cffd91710f403a865c8922
|
| 3 |
size 6299896
|
debug.log
CHANGED
|
@@ -1267,3 +1267,234 @@ trainable params: 1,572,864 || all params: 3,837,594,624 || trainable%: 0.0410
|
|
| 1267 |
|
| 1268 |
62%|ββββββββββββββββββββββββββββββββββββ | 400/650 [1:03:04<34:25, 8.26s/it]
|
| 1269 |
|
| 1270 |
|
| 1271 |
[A[2026-01-24 14:28:37,265] [INFO] [axolotl.core.trainers.base._save:721] [PID:9359] Saving model checkpoint to ./phi4_african_history_lora_out/checkpoint-400
|
|
|
|
| 1272 |
62%|βββββββββββββββββββββββββββββββββββ | 401/650 [1:03:13<1:42:25, 24.68s/it]
|
| 1273 |
62%|βββββββββββββββββββββββββββββββββββ | 402/650 [1:03:21<1:21:38, 19.75s/it]
|
| 1274 |
62%|βββββββββββββββββββββββββββββββββββ | 403/650 [1:03:27<1:04:39, 15.71s/it]
|
| 1275 |
62%|ββββββββββββββββββββββββββββββββββββ | 404/650 [1:03:37<57:40, 14.07s/it]
|
| 1276 |
62%|βββββββββββββββββββββββββββββββββββββ | 405/650 [1:03:46<50:18, 12.32s/it]
|
| 1277 |
|
|
|
|
| 1278 |
62%|βββββββββββββββββββββββββββββββββββββ | 405/650 [1:03:46<50:18, 12.32s/it]
|
| 1279 |
62%|βββββββββββββββββββββββββββββββββββββ | 406/650 [1:03:54<45:09, 11.10s/it]
|
| 1280 |
63%|βββββββββββββββββββββββββββββββββββββ | 407/650 [1:04:02<41:30, 10.25s/it]
|
| 1281 |
63%|βββββββββββββββββββββββββββββββββββββ | 408/650 [1:04:11<38:54, 9.65s/it]
|
| 1282 |
63%|βββββββββββββββββββββββββββββββββββββ | 409/650 [1:04:19<37:04, 9.23s/it]
|
| 1283 |
63%|βββββββββββββββββββββββββββββββββββββ | 410/650 [1:04:27<35:44, 8.93s/it]
|
| 1284 |
|
|
|
|
| 1285 |
63%|βββββββββββββββββββββββββββββββββββββ | 410/650 [1:04:27<35:44, 8.93s/it]
|
| 1286 |
63%|βββββββββββββββββββββββββββββββββββββ | 411/650 [1:04:35<34:45, 8.73s/it]
|
| 1287 |
63%|βββββββββββββββββββββββββββββββββββββ | 412/650 [1:04:43<34:02, 8.58s/it]
|
| 1288 |
64%|βββββββββββββββββββββββββββββββββββββ | 413/650 [1:04:52<33:30, 8.48s/it]
|
| 1289 |
64%|βββββββββββββββββββββββββββββββββββββ | 414/650 [1:05:00<33:05, 8.41s/it]
|
| 1290 |
64%|βββββββββββββββββββββββββββββββββββββ | 415/650 [1:05:08<32:45, 8.36s/it]
|
| 1291 |
|
|
|
|
| 1292 |
64%|ββββββββββββββββββββββββββββοΏ½οΏ½ββββββββ | 415/650 [1:05:08<32:45, 8.36s/it]
|
| 1293 |
64%|βββββββββββββββββββββββββββββββββββββ | 416/650 [1:05:14<30:08, 7.73s/it]
|
| 1294 |
64%|ββββββββββββββββββββββββββββββββββββββ | 417/650 [1:05:25<32:47, 8.45s/it]
|
| 1295 |
64%|ββββββββββββββββββββββββββββββββββββββ | 418/650 [1:05:33<32:25, 8.38s/it]
|
| 1296 |
64%|ββββββββββββββββββββββββββββββββββββββ | 419/650 [1:05:41<32:06, 8.34s/it]
|
| 1297 |
65%|ββββββββββββββββββββββββββββββββββββββ | 420/650 [1:05:49<31:51, 8.31s/it]
|
| 1298 |
|
|
|
|
| 1299 |
65%|ββββββββββββββββββββββββββββββββββββββ | 420/650 [1:05:49<31:51, 8.31s/it]
|
| 1300 |
65%|ββββββββββββββββββββββββββββββββββββββ | 421/650 [1:05:58<31:39, 8.30s/it]
|
| 1301 |
65%|ββββββββββββββββββββββββββββββββββββββ | 422/650 [1:06:06<31:28, 8.28s/it]
|
| 1302 |
65%|ββββββββββββββββββββββββββββββββββββββ | 423/650 [1:06:14<31:18, 8.27s/it]
|
| 1303 |
65%|ββββββββββββββββββββββββββββββββββββββ | 424/650 [1:06:22<31:08, 8.27s/it]
|
| 1304 |
65%|ββββββββββββββββββββββββββββββββββββββ | 425/650 [1:06:31<30:58, 8.26s/it]
|
| 1305 |
|
|
|
|
| 1306 |
65%|ββββββββββββββββββββββββββββββββββββββ | 425/650 [1:06:31<30:58, 8.26s/it]
|
| 1307 |
66%|ββββββββββββββββββββββββββββββββββββββ | 426/650 [1:06:39<30:49, 8.26s/it]
|
| 1308 |
66%|ββββββββββββββββββββββββββββββββββββββ | 427/650 [1:06:47<30:41, 8.26s/it]
|
| 1309 |
66%|βββββββββββββββββββββββββββββββββββββββ | 428/650 [1:06:55<30:32, 8.25s/it]
|
| 1310 |
66%|βββββββββββββββββββββββββββββββββββββββ | 429/650 [1:07:02<28:10, 7.65s/it]
|
| 1311 |
66%|βββββββββββββββββββββββββββββββββββββββ | 430/650 [1:07:12<30:46, 8.40s/it]
|
| 1312 |
|
|
|
|
| 1313 |
66%|βββββββββββββββββββββββββββββββββββββββ | 430/650 [1:07:12<30:46, 8.40s/it]
|
| 1314 |
66%|βββββββββββββββββββββββββββββββββββββββ | 431/650 [1:07:20<30:29, 8.35s/it]
|
| 1315 |
66%|βββββββββββββββββββββββββββββββββββββββ | 432/650 [1:07:28<30:14, 8.32s/it]
|
| 1316 |
67%|βββββββββββββββββββββββββββββββββββββββ | 433/650 [1:07:36<30:01, 8.30s/it]
|
| 1317 |
67%|ββοΏ½οΏ½ββββββββββββββββββββββββββββββββββββ | 434/650 [1:07:45<29:49, 8.29s/it]
|
| 1318 |
67%|βββββββββββββββββββββββββββββββββββββββ | 435/650 [1:07:53<29:38, 8.27s/it]
|
| 1319 |
|
|
|
|
| 1320 |
67%|βββββββββββββββββββββββββββββββββββββββ | 435/650 [1:07:53<29:38, 8.27s/it]
|
| 1321 |
67%|βββββββββββββββββββββββββββββββββββββββ | 436/650 [1:08:01<29:29, 8.27s/it]
|
| 1322 |
67%|βββββββββββββββββββββββββββββββββββββββ | 437/650 [1:08:09<29:19, 8.26s/it]
|
| 1323 |
67%|βββββββββββββββββββββββββββββββββββββββ | 438/650 [1:08:18<29:11, 8.26s/it]
|
| 1324 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 439/650 [1:08:26<29:02, 8.26s/it]
|
| 1325 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 440/650 [1:08:34<28:54, 8.26s/it]
|
| 1326 |
|
|
|
|
| 1327 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 440/650 [1:08:34<28:54, 8.26s/it]
|
| 1328 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 441/650 [1:08:43<28:46, 8.26s/it]
|
| 1329 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 442/650 [1:08:49<26:33, 7.66s/it]
|
| 1330 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 443/650 [1:08:59<28:59, 8.40s/it]
|
| 1331 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 444/650 [1:09:07<28:41, 8.36s/it]
|
| 1332 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 445/650 [1:09:15<28:26, 8.33s/it]
|
| 1333 |
|
|
|
|
| 1334 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 445/650 [1:09:15<28:26, 8.33s/it]
|
| 1335 |
69%|ββββββββββββββββββββββββββββββββββββββββ | 446/650 [1:09:24<28:13, 8.30s/it]
|
| 1336 |
69%|ββββββββββββββββββββββββββββββββββββββββ | 447/650 [1:09:32<28:02, 8.29s/it]
|
| 1337 |
69%|ββββββββββββββββββββββββββββββββββββββββ | 448/650 [1:09:40<27:51, 8.28s/it]
|
| 1338 |
69%|ββββββββββββββββββββββββββββββββββββββββ | 449/650 [1:09:48<27:41, 8.27s/it]
|
| 1339 |
69%|βββββββββββββββββββββββββββββββββββββββββ | 450/650 [1:09:57<27:32, 8.26s/it]
|
| 1340 |
|
|
|
|
| 1341 |
69%|βββββββββββββββββββββββββββββββββββββββββ | 450/650 [1:09:57<27:32, 8.26s/it][2026-01-24 14:35:30,194] [INFO] [axolotl.core.trainers.base.evaluate:400] [PID:9359] Running evaluation step...
|
|
|
|
|
|
|
| 1342 |
0%| | 0/100 [00:00<?, ?it/s][A
|
|
|
|
| 1343 |
2%|ββ | 2/100 [00:00<00:25, 3.85it/s][A
|
|
|
|
| 1344 |
3%|ββ | 3/100 [00:01<00:35, 2.71it/s][A
|
|
|
|
| 1345 |
4%|βββ | 4/100 [00:01<00:40, 2.35it/s][A
|
|
|
|
| 1346 |
5%|βββ | 5/100 [00:02<00:56, 1.69it/s][A
|
|
|
|
| 1347 |
6%|ββββ | 6/100 [00:02<00:53, 1.76it/s][A
|
|
|
|
| 1348 |
7%|βββββ | 7/100 [00:03<00:51, 1.81it/s][A
|
|
|
|
| 1349 |
8%|βββββ | 8/100 [00:04<00:50, 1.84it/s][A
|
|
|
|
| 1350 |
9%|ββββββ | 9/100 [00:04<00:50, 1.82it/s][A
|
|
|
|
| 1351 |
10%|ββββββ | 10/100 [00:05<00:48, 1.85it/s][A
|
|
|
|
| 1352 |
11%|βββββββ | 11/100 [00:05<00:47, 1.87it/s][A
|
|
|
|
| 1353 |
12%|ββββββββ | 12/100 [00:06<00:46, 1.89it/s][A
|
|
|
|
| 1354 |
13%|ββββββββ | 13/100 [00:06<00:46, 1.85it/s][A
|
|
|
|
| 1355 |
14%|βββββββββ | 14/100 [00:07<00:45, 1.87it/s][A
|
|
|
|
| 1356 |
15%|ββββββββββ | 15/100 [00:07<00:45, 1.89it/s][A
|
|
|
|
| 1357 |
16%|ββββββββββ | 16/100 [00:08<00:44, 1.90it/s][A
|
|
|
|
| 1358 |
17%|βββββββββββ | 17/100 [00:08<00:44, 1.86it/s][A
|
|
|
|
| 1359 |
18%|βββββββββββ | 18/100 [00:09<00:43, 1.88it/s][A
|
|
|
|
| 1360 |
19%|ββββββββββββ | 19/100 [00:09<00:42, 1.89it/s][A
|
|
|
|
| 1361 |
20%|βββββββββββββ | 20/100 [00:10<00:42, 1.90it/s][A
|
|
|
|
| 1362 |
21%|βββββββββββββ | 21/100 [00:10<00:42, 1.86it/s][A
|
|
|
|
| 1363 |
22%|ββββββββββββββ | 22/100 [00:11<00:41, 1.88it/s][A
|
|
|
|
| 1364 |
23%|ββββββββββββββ | 23/100 [00:12<00:40, 1.89it/s][A
|
|
|
|
| 1365 |
24%|βββββββββββββββ | 24/100 [00:12<00:40, 1.90it/s][A
|
|
|
|
| 1366 |
25%|ββββββββββββββββ | 25/100 [00:13<00:40, 1.86it/s][A
|
|
|
|
| 1367 |
26%|ββββββββββββββββ | 26/100 [00:13<00:39, 1.88it/s][A
|
|
|
|
| 1368 |
27%|βββββββββββββββββ | 27/100 [00:14<00:38, 1.89it/s][A
|
|
|
|
| 1369 |
28%|βββββββββββββββββ | 28/100 [00:14<00:37, 1.90it/s][A
|
|
|
|
| 1370 |
29%|ββββββββββββββββββ | 29/100 [00:15<00:38, 1.86it/s][A
|
|
|
|
| 1371 |
30%|βββββββββββββββββββ | 30/100 [00:15<00:37, 1.88it/s][A
|
|
|
|
| 1372 |
31%|βββββββββββββββββββ | 31/100 [00:16<00:36, 1.89it/s][A
|
|
|
|
| 1373 |
32%|ββββββββββββββββββββ | 32/100 [00:16<00:35, 1.90it/s][A
|
|
|
|
| 1374 |
33%|βββββββββββββββββββββ | 33/100 [00:17<00:36, 1.86it/s][A
|
|
|
|
| 1375 |
34%|βββββββββββββββββββββ | 34/100 [00:17<00:35, 1.88it/s][A
|
|
|
|
| 1376 |
35%|ββββββββββββββββββββββ | 35/100 [00:18<00:34, 1.89it/s][A
|
|
|
|
| 1377 |
36%|ββββββββββββββββββββββ | 36/100 [00:18<00:33, 1.90it/s][A
|
|
|
|
| 1378 |
37%|βββββββββββββββββββββββ | 37/100 [00:19<00:35, 1.79it/s][A
|
|
|
|
| 1379 |
38%|ββββββββββββββββββββββββ | 38/100 [00:19<00:32, 1.90it/s][A
|
|
|
|
| 1380 |
39%|ββββββββββββββββββββββββ | 39/100 [00:20<00:31, 1.91it/s][A
|
|
|
|
| 1381 |
40%|βββββββββββββββββββββββββ | 40/100 [00:21<00:31, 1.91it/s][A
|
|
|
|
| 1382 |
41%|βββββββββββββββββββββββββ | 41/100 [00:21<00:31, 1.87it/s][A
|
|
|
|
| 1383 |
42%|ββββββββββββββββββββββββββ | 42/100 [00:22<00:30, 1.89it/s][A
|
|
|
|
| 1384 |
43%|βββββββββββββββββββββββββββ | 43/100 [00:22<00:30, 1.89it/s][A
|
|
|
|
| 1385 |
44%|βββββββββββββββββββββββββββ | 44/100 [00:23<00:29, 1.90it/s][A
|
|
|
|
| 1386 |
45%|ββββββββββββββββββββββββββββ | 45/100 [00:23<00:29, 1.86it/s][A
|
|
|
|
| 1387 |
46%|ββββββββββββββββββββββββββββ | 46/100 [00:24<00:28, 1.88it/s][A
|
|
|
|
| 1388 |
47%|βββββββββββββββββββββββββββββ | 47/100 [00:24<00:28, 1.89it/s][A
|
|
|
|
| 1389 |
48%|ββββββββββββββββββββββββββββββ | 48/100 [00:25<00:27, 1.90it/s][A
|
|
|
|
| 1390 |
49%|ββββββββββββββββββββββββββββββ | 49/100 [00:25<00:27, 1.86it/s][A
|
|
|
|
| 1391 |
50%|βββββββββββββββββββββββββββββββ | 50/100 [00:26<00:26, 1.88it/s][A
|
|
|
|
| 1392 |
51%|βββββββββββββββββββββββββββββββ | 51/100 [00:26<00:25, 1.89it/s][A
|
|
|
|
| 1393 |
52%|ββββββββββββββββββββββββββββββββ | 52/100 [00:27<00:25, 1.90it/s][A
|
|
|
|
| 1394 |
53%|βββββββββββββββββββββββββββββββββ | 53/100 [00:27<00:25, 1.86it/s][A
|
|
|
|
| 1395 |
54%|βββββββββββββββββββββββββββββββββ | 54/100 [00:28<00:24, 1.88it/s][A
|
|
|
|
| 1396 |
55%|ββββββββββββββββββββββββββββββββββ | 55/100 [00:29<00:23, 1.89it/s][A
|
|
|
|
| 1397 |
56%|βββββββββββββββββββββββββββββββββββ | 56/100 [00:29<00:23, 1.90it/s][A
|
|
|
|
| 1398 |
57%|βββββββββββββββββββββββββββββββββββ | 57/100 [00:30<00:23, 1.86it/s][A
|
|
|
|
| 1399 |
58%|ββββββββββββββββββββββββββββββββββββ | 58/100 [00:30<00:22, 1.88it/s][A
|
|
|
|
| 1400 |
59%|ββββββββββββββββββββββββββββββββββββ | 59/100 [00:31<00:21, 1.89it/s][A
|
|
|
|
| 1401 |
60%|βββββββββββββββββββββββββββββββββββββ | 60/100 [00:31<00:21, 1.90it/s][A
|
|
|
|
| 1402 |
61%|ββββββββββββββββββββββββββββββββββββββ | 61/100 [00:32<00:20, 1.86it/s][A
|
|
|
|
| 1403 |
62%|ββββββββββββββββββββββββββββββββββββββ | 62/100 [00:32<00:20, 1.88it/s][A
|
|
|
|
| 1404 |
63%|βββββββββββββββββββββββββββββββββββββββ | 63/100 [00:33<00:19, 1.89it/s][A
|
|
|
|
| 1405 |
64%|βββββββββββββββββββββββββββββββββββββββ | 64/100 [00:33<00:18, 1.90it/s][A
|
|
|
|
| 1406 |
65%|ββββββββββββββββββββββββββββββββββββββββ | 65/100 [00:34<00:18, 1.86it/s][A
|
|
|
|
| 1407 |
66%|βββββββββββββββββββββββββββββββββββββββββ | 66/100 [00:34<00:18, 1.88it/s][A
|
|
|
|
| 1408 |
67%|βββββββββββββοΏ½οΏ½οΏ½βββββββββββββββββββββββββββ | 67/100 [00:35<00:17, 1.89it/s][A
|
|
|
|
| 1409 |
68%|ββββββββββββββββββββββββββββββββββββββββββ | 68/100 [00:35<00:16, 1.90it/s][A
|
|
|
|
| 1410 |
69%|ββββββββββββββββββββββββββββββββββββββββββ | 69/100 [00:36<00:16, 1.86it/s][A
|
|
|
|
| 1411 |
70%|βββββββββββββββββββββββββββββββββββββββββββ | 70/100 [00:36<00:15, 1.88it/s][A
|
|
|
|
| 1412 |
71%|ββββββββββββββββββββββββββββββββββββββββββββ | 71/100 [00:37<00:15, 1.89it/s][A
|
|
|
|
| 1413 |
72%|ββββββββββββββββββββββββββββββββββββββββββββ | 72/100 [00:38<00:14, 1.90it/s][A
|
|
|
|
| 1414 |
73%|βββββββββββββββββββββββββββββββββββββββββββββ | 73/100 [00:38<00:14, 1.86it/s][A
|
|
|
|
| 1415 |
74%|ββββββββββββββββββββββββββββββββββββββββββββββ | 74/100 [00:39<00:13, 1.88it/s][A
|
|
|
|
| 1416 |
75%|ββββββββββββββββββββββββββββββββββββββββββββββ | 75/100 [00:39<00:13, 1.89it/s][A
|
|
|
|
| 1417 |
76%|βββββββββββββββββββββββββββββββββββββββββββββββ | 76/100 [00:40<00:12, 1.90it/s][A
|
|
|
|
| 1418 |
77%|βββββββββββββββββββββββββββββββββββββββββββββββ | 77/100 [00:40<00:12, 1.86it/s][A
|
|
|
|
| 1419 |
78%|ββββββββββββββββββββββββββββββββββββββββββββββββ | 78/100 [00:41<00:11, 1.88it/s][A
|
|
|
|
| 1420 |
79%|βββββββββββββββββββββββββββββββββββββββββββββββββ | 79/100 [00:41<00:11, 1.89it/s][A
|
|
|
|
| 1421 |
80%|βββββββββββββββββββββββββββββββββββββββββββββββββ | 80/100 [00:42<00:10, 1.90it/s][A
|
|
|
|
| 1422 |
81%|ββββββββββββββββββββββββββββββββββββββββββββββββββ | 81/100 [00:42<00:10, 1.86it/s][A
|
|
|
|
| 1423 |
82%|ββββββββββββββββββββββββββββββββββββββββββββββββββ | 82/100 [00:43<00:09, 1.88it/s][A
|
|
|
|
| 1424 |
83%|βββββββββββββββββββββββββββββββββββββββββββββββββββ | 83/100 [00:43<00:08, 1.89it/s][A
|
|
|
|
| 1425 |
84%|ββββββββββββββββββββββββββββββββββββββββββββββββββββ | 84/100 [00:44<00:08, 1.90it/s][A
|
|
|
|
| 1426 |
85%|ββββββββββββββββββββββββββββββββββββββββββββββββββββ | 85/100 [00:44<00:08, 1.86it/s][A
|
|
|
|
| 1427 |
86%|βββββββββββββββββββββββββββββββββββββββββββββββββββββ | 86/100 [00:45<00:07, 1.88it/s][A
|
|
|
|
| 1428 |
87%|βββββββββββββββββββββββββββββββββββββββββββββββββββββ | 87/100 [00:46<00:06, 1.89it/s][A
|
|
|
|
| 1429 |
88%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 88/100 [00:46<00:06, 1.90it/s][A
|
|
|
|
| 1430 |
89%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 89/100 [00:47<00:05, 1.86it/s][A
|
|
|
|
| 1431 |
90%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 90/100 [00:47<00:05, 1.88it/s][A
|
|
|
|
| 1432 |
91%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 91/100 [00:48<00:04, 1.89it/s][A
|
|
|
|
| 1433 |
92%|βββββββββββββββββββββββββββββββββββοΏ½οΏ½ββββββββββββββββββββ | 92/100 [00:48<00:04, 1.90it/s][A
|
|
|
|
| 1434 |
93%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 93/100 [00:49<00:03, 1.86it/s][A
|
|
|
|
| 1435 |
94%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 94/100 [00:49<00:03, 1.88it/s][A
|
|
|
|
| 1436 |
95%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 95/100 [00:50<00:02, 1.89it/s][A
|
|
|
|
| 1437 |
96%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 96/100 [00:50<00:02, 1.90it/s][A
|
|
|
|
| 1438 |
97%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 97/100 [00:51<00:01, 1.86it/s][A
|
|
|
|
| 1439 |
98%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 98/100 [00:51<00:01, 1.88it/s][A
|
|
|
|
| 1440 |
99%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ| 99/100 [00:52<00:00, 1.89it/s][A
|
|
|
|
| 1441 |
|
|
|
|
| 1442 |
|
|
|
|
| 1443 |
69%|βββββββββββββββββββββββββββββββββββββββββ | 450/650 [1:10:51<27:32, 8.26s/it]
|
|
|
|
|
|
|
| 1444 |
[A
|
| 1445 |
69%|βββββββββββββββββββββββββββββββββββββββ | 451/650 [1:10:59<1:21:14, 24.49s/it]
|
| 1446 |
70%|βββββββββββββββββββββββββββββββββββββββ | 452/650 [1:11:07<1:04:45, 19.62s/it]
|
| 1447 |
70%|βββββββββββββββββββββββββββββββββββββββββ | 453/650 [1:11:16<53:13, 16.21s/it]
|
| 1448 |
70%|βββββββββββββββββββββββββββββββββββββββββ | 454/650 [1:11:24<45:08, 13.82s/it]
|
| 1449 |
70%|βββββββββββββββββββββββββββββββββββββββββ | 455/650 [1:11:30<37:31, 11.55s/it]
|
| 1450 |
|
|
|
|
| 1451 |
70%|βββββββββββββββββββββββββββββββββββββββββ | 455/650 [1:11:30<37:31, 11.55s/it]
|
| 1452 |
70%|βββββββββββββββββββββββββββββββββββββββββ | 456/650 [1:11:40<35:56, 11.11s/it]
|
| 1453 |
70%|βββββββββββββββββββββββββββββββββββββββββ | 457/650 [1:11:48<32:59, 10.26s/it]
|
| 1454 |
70%|βββββββββββββββββββββββββββββββββββββββββ | 458/650 [1:11:57<30:53, 9.65s/it]
|
| 1455 |
71%|βββββββββββββββββββββββββββββββββββββββββ | 459/650 [1:12:05<29:23, 9.23s/it]
|
| 1456 |
71%|βββββββββββββββββββββββββββββββββββββββββ | 460/650 [1:12:13<28:17, 8.94s/it]
|
| 1457 |
|
|
|
|
| 1458 |
71%|βββββββββββββββββββββββββββββββββββββββββ | 460/650 [1:12:13<28:17, 8.94s/it]
|
| 1459 |
71%|ββββββββββββββββββββββββββββββββββββββββββ | 461/650 [1:12:21<27:29, 8.73s/it]
|
| 1460 |
71%|ββββββββββββββββββββββββββββββββββββββββββ | 462/650 [1:12:30<26:54, 8.59s/it]
|
| 1461 |
71%|ββββββββββββββββββββββββββββββββββββββββββ | 463/650 [1:12:38<26:26, 8.48s/it]
|
| 1462 |
71%|ββββββββββββββββββββββββββββββββββββββββββ | 464/650 [1:12:46<26:04, 8.41s/it]
|
| 1463 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 465/650 [1:12:54<25:46, 8.36s/it]
|
| 1464 |
|
|
|
|
| 1465 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 465/650 [1:12:54<25:46, 8.36s/it]
|
| 1466 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 466/650 [1:13:03<25:31, 8.32s/it]
|
| 1467 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 467/650 [1:13:11<25:18, 8.30s/it]
|
| 1468 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 468/650 [1:13:17<23:18, 7.68s/it]
|
| 1469 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 469/650 [1:13:27<25:25, 8.43s/it]
|
| 1470 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 470/650 [1:13:35<25:07, 8.37s/it]
|
| 1471 |
|
|
|
|
| 1472 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 470/650 [1:13:35<25:07, 8.37s/it]
|
| 1473 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 471/650 [1:13:44<24:51, 8.33s/it]
|
| 1474 |
73%|ββββββββββββββββββββββββββββββββββββββββββ | 472/650 [1:13:52<24:38, 8.30s/it]
|
| 1475 |
73%|βββββββββββββββββββββββββββββββββββββββββββ | 473/650 [1:14:00<24:27, 8.29s/it]
|
| 1476 |
73%|βββββββββββββββββββββββββββββββββββββββββββ | 474/650 [1:14:08<24:16, 8.27s/it]
|
| 1477 |
73%|βββββββββββββββββββββββββββββββββββββββββββ | 475/650 [1:14:17<24:07, 8.27s/it]
|
| 1478 |
|
|
|
|
| 1479 |
73%|βββββββββββββββββββββββββββββββββββββββββββ | 475/650 [1:14:17<24:07, 8.27s/it]
|
| 1480 |
73%|βββββββββββββββββββββββββββββββββββββββββββ | 476/650 [1:14:25<23:57, 8.26s/it]
|
| 1481 |
73%|βββββββββββββββββββββββββββββββββββββββββββ | 477/650 [1:14:33<23:48, 8.26s/it]
|
| 1482 |
74%|βββββββββββββββββββββββββββββββββββββββββββ | 478/650 [1:14:41<23:39, 8.25s/it]
|
| 1483 |
74%|βββββββββββββββββββββββββββββββββββββββββββ | 479/650 [1:14:50<23:30, 8.25s/it]
|
| 1484 |
74%|βββββββββββββββββββββββββββββββββββββββββββ | 480/650 [1:14:58<23:21, 8.24s/it]
|
| 1485 |
|
|
|
|
| 1486 |
74%|βββββββββββββββββββββββββββββββββββββββββββ | 480/650 [1:14:58<23:21, 8.24s/it]
|
| 1487 |
74%|βββββββββββββββββββββββββββββββββββββββββββ | 481/650 [1:15:04<21:31, 7.64s/it]
|
| 1488 |
74%|βββββββββββββββββββββββββββββββββββββββββββ | 482/650 [1:15:14<23:28, 8.38s/it]
|
| 1489 |
74%|βββββββββββββββββββββββββββββββββββββββββββ | 483/650 [1:15:23<23:13, 8.34s/it]
|
| 1490 |
74%|ββββββββββββββββββββββββββββββββββββββββββββ | 484/650 [1:15:31<22:59, 8.31s/it]
|
| 1491 |
75%|ββββββββββββββββββββββββββββββββββββββββββββ | 485/650 [1:15:39<22:47, 8.29s/it]
|
| 1492 |
|
|
|
|
| 1493 |
75%|ββββββββββββββββββββββββββββββββββββββββββββ | 485/650 [1:15:39<22:47, 8.29s/it]
|
| 1494 |
75%|ββββββββββββββββββββββββββββββββββββββββββββ | 486/650 [1:15:47<22:37, 8.28s/it]
|
| 1495 |
75%|ββββββββββββββββββββββββββββββββββββββββββββ | 487/650 [1:15:55<22:27, 8.27s/it]
|
| 1496 |
75%|ββββββββββββββββββββββββββββββββββββββββββββ | 488/650 [1:16:04<22:17, 8.26s/it]
|
| 1497 |
75%|ββββββββββββββββββββββββββββββββββββββββββββ | 489/650 [1:16:12<22:09, 8.25s/it]
|
| 1498 |
75%|ββββββββββββββββββββββββββββββββββββββββββββ | 490/650 [1:16:20<22:00, 8.25s/it]
|
| 1499 |
|
|
|
|
| 1500 |
75%|ββββββββββββββββββββββββββββββββββββββββββββ | 490/650 [1:16:20<22:00, 8.25s/it]
|
| 1501 |
76%|ββββββββββββββββββοΏ½οΏ½οΏ½βββββββββββββββββββββββββ | 491/650 [1:16:28<21:51, 8.25s/it]
|
| 1502 |
76%|ββββββββββββββββββββββββββββββββββββββββββββ | 492/650 [1:16:37<21:42, 8.24s/it]
|
| 1503 |
76%|ββββββββββββββββββββββββββββββββββββββββββββ | 493/650 [1:16:45<21:34, 8.25s/it]
|
| 1504 |
76%|ββββββββββββββββββββββββββββββββββββββββββββ | 494/650 [1:16:51<19:52, 7.65s/it]
|
| 1505 |
76%|βββββββββββββββββββββββββββββββββββββββββββββ | 495/650 [1:17:01<21:41, 8.40s/it]
|
| 1506 |
|
|
|
|
| 1507 |
76%|βββββββββββββββββββββββββββββββββββββββββββββ | 495/650 [1:17:01<21:41, 8.40s/it]
|
| 1508 |
76%|βββββββββββββββββββββββββββββββββββββββββββββ | 496/650 [1:17:10<21:26, 8.35s/it]
|
| 1509 |
76%|βββββββββββββββββββββββββββββββββββββββββββββ | 497/650 [1:17:18<21:12, 8.32s/it]
|
| 1510 |
77%|βββββββββββββββββββββββββββββββββββββββββββββ | 498/650 [1:17:26<21:00, 8.29s/it]
|
| 1511 |
77%|βββββββββββββββββββββββββββββββββββββββββββββ | 499/650 [1:17:34<20:49, 8.28s/it]
|
| 1512 |
77%|βββββββββββββββββββββββββββββββββββββββββββββ | 500/650 [1:17:43<20:39, 8.27s/it]
|
| 1513 |
|
|
|
|
| 1514 |
77%|βββββββββββββββββββββββββββββββββββββββββββββ | 500/650 [1:17:43<20:39, 8.27s/it][2026-01-24 14:43:16,073] [INFO] [axolotl.core.trainers.base.evaluate:400] [PID:9359] Running evaluation step...
|
|
|
|
|
|
|
| 1515 |
0%| | 0/100 [00:00<?, ?it/s][A
|
|
|
|
| 1516 |
2%|ββ | 2/100 [00:00<00:25, 3.86it/s][A
|
|
|
|
| 1517 |
3%|ββ | 3/100 [00:01<00:35, 2.72it/s][A
|
|
|
|
| 1518 |
4%|βββ | 4/100 [00:01<00:40, 2.35it/s][A
|
|
|
|
| 1519 |
5%|βββ | 5/100 [00:02<00:54, 1.75it/s][A
|
|
|
|
| 1520 |
6%|ββββ | 6/100 [00:02<00:52, 1.81it/s][A
|
|
|
|
| 1521 |
7%|βββββ | 7/100 [00:03<00:50, 1.84it/s][A
|
|
|
|
| 1522 |
8%|βββββ | 8/100 [00:03<00:49, 1.87it/s][A
|
|
|
|
| 1523 |
9%|ββββββ | 9/100 [00:04<00:49, 1.84it/s][A
|
|
|
|
| 1524 |
10%|ββββββ | 10/100 [00:05<00:48, 1.87it/s][A
|
|
|
|
| 1525 |
11%|βββββββ | 11/100 [00:05<00:47, 1.88it/s][A
|
|
|
|
| 1526 |
12%|ββββββββ | 12/100 [00:06<00:46, 1.89it/s][A
|
|
|
|
| 1527 |
13%|ββββββββ | 13/100 [00:06<00:46, 1.86it/s][A
|
|
|
|
| 1528 |
14%|βββββββββ | 14/100 [00:07<00:45, 1.88it/s][A
|
|
|
|
| 1529 |
15%|ββββββββββ | 15/100 [00:07<00:44, 1.89it/s][A
|
|
|
|
| 1530 |
16%|ββββββββββ | 16/100 [00:08<00:44, 1.90it/s][A
|
|
|
|
| 1531 |
17%|βββββββββββ | 17/100 [00:08<00:44, 1.86it/s][A
|
|
|
|
| 1532 |
18%|βββββββββββ | 18/100 [00:09<00:43, 1.89it/s][A
|
|
|
|
| 1533 |
19%|ββββββββββββ | 19/100 [00:09<00:42, 1.90it/s][A
|
|
|
|
| 1534 |
20%|βββββββββββββ | 20/100 [00:10<00:42, 1.90it/s][A
|
|
|
|
| 1535 |
21%|βββββββββββββ | 21/100 [00:10<00:42, 1.86it/s][A
|
|
|
|
| 1536 |
22%|ββββββββββββββ | 22/100 [00:11<00:41, 1.88it/s][A
|
|
|
|
| 1537 |
23%|ββββββββββββββ | 23/100 [00:11<00:40, 1.89it/s][A
|
|
|
|
| 1538 |
24%|βββββββββββββββ | 24/100 [00:12<00:39, 1.90it/s][A
|
|
|
|
| 1539 |
25%|ββββββββββββββββ | 25/100 [00:13<00:40, 1.86it/s][A
|
|
|
|
| 1540 |
26%|ββββββββββββββββ | 26/100 [00:13<00:39, 1.88it/s][A
|
|
|
|
| 1541 |
27%|βββββββββββββββββ | 27/100 [00:14<00:38, 1.89it/s][A
|
|
|
|
| 1542 |
28%|βββββββββββββββββ | 28/100 [00:14<00:37, 1.90it/s][A
|
|
|
|
| 1543 |
29%|ββββββββββββββββββ | 29/100 [00:15<00:38, 1.86it/s][A
|
|
|
|
| 1544 |
30%|βββββββββββββββββββ | 30/100 [00:15<00:37, 1.88it/s][A
|
|
|
|
| 1545 |
31%|βββββββββββββββββββ | 31/100 [00:16<00:36, 1.89it/s][A
|
|
|
|
| 1546 |
32%|ββββββββββββββββββββ | 32/100 [00:16<00:35, 1.90it/s][A
|
|
|
|
| 1547 |
33%|βββββββββββββββββββββ | 33/100 [00:17<00:35, 1.86it/s][A
|
|
|
|
| 1548 |
34%|βββββββββββββββββββββ | 34/100 [00:17<00:35, 1.88it/s][A
|
|
|
|
| 1549 |
35%|ββββββββββββββββββββββ | 35/100 [00:18<00:34, 1.89it/s][A
|
|
|
|
| 1550 |
36%|ββββββββββββββββββββββ | 36/100 [00:18<00:33, 1.90it/s][A
|
|
|
|
| 1551 |
37%|βββββββββββββββββββββββ | 37/100 [00:19<00:33, 1.86it/s][A
|
|
|
|
| 1552 |
38%|ββββββββββββββββββββββββ | 38/100 [00:19<00:32, 1.88it/s][A
|
|
|
|
| 1553 |
39%|ββββββββββββββββββββββββ | 39/100 [00:20<00:32, 1.89it/s][A
|
|
|
|
| 1554 |
40%|βββββββββββββββββββββββββ | 40/100 [00:20<00:31, 1.90it/s][A
|
|
|
|
| 1555 |
41%|βββββββββββββββββββββββββ | 41/100 [00:21<00:31, 1.86it/s][A
|
|
|
|
| 1556 |
42%|ββββββββββββββββββββββββββ | 42/100 [00:22<00:30, 1.88it/s][A
|
|
|
|
| 1557 |
43%|βββββββββββββββββββββββββββ | 43/100 [00:22<00:30, 1.89it/s][A
|
|
|
|
| 1558 |
44%|βββββββββββββββββββββββββββ | 44/100 [00:23<00:29, 1.90it/s][A
|
|
|
|
| 1559 |
45%|ββββββββββββββββββββββββββββ | 45/100 [00:23<00:29, 1.86it/s][A
|
|
|
|
| 1560 |
46%|ββββββββββββββββββββββββββββ | 46/100 [00:24<00:28, 1.88it/s][A
|
|
|
|
| 1561 |
47%|βββββββββββββββββββββββββββββ | 47/100 [00:24<00:28, 1.89it/s][A
|
|
|
|
| 1562 |
48%|ββββββββββββββββββββββββββββββ | 48/100 [00:25<00:27, 1.90it/s][A
|
|
|
|
| 1563 |
49%|ββββββββββββββββββββββββββββββ | 49/100 [00:25<00:27, 1.86it/s][A
|
|
|
|
| 1564 |
50%|βββββββββββββββββββββββββββββββ | 50/100 [00:26<00:26, 1.88it/s][A
|
|
|
|
| 1565 |
51%|βββββββββββββββββββββββββββββββ | 51/100 [00:26<00:25, 1.89it/s][A
|
|
|
|
| 1566 |
52%|βββββοΏ½οΏ½ββββββββββββββββββββββββββ | 52/100 [00:27<00:25, 1.90it/s][A
|
|
|
|
| 1567 |
53%|βββββββββββββββββββββββββββββββββ | 53/100 [00:27<00:25, 1.86it/s][A
|
|
|
|
| 1568 |
54%|βββββββββββββββββββββββββββββββββ | 54/100 [00:28<00:24, 1.88it/s][A
|
|
|
|
| 1569 |
55%|ββββββββββββββββββββββββββββββββββ | 55/100 [00:28<00:23, 1.89it/s][A
|
|
|
|
| 1570 |
56%|βββββββββββββββββββββββββββββββββββ | 56/100 [00:29<00:23, 1.90it/s][A
|
|
|
|
| 1571 |
57%|βββββββββββββββββββββββββββββββββββ | 57/100 [00:29<00:23, 1.86it/s][A
|
|
|
|
| 1572 |
58%|ββββββββββββββββββββββββββββββββββββ | 58/100 [00:30<00:22, 1.88it/s][A
|
|
|
|
| 1573 |
59%|ββββββββββββββββββββββββββββββββββββ | 59/100 [00:31<00:21, 1.89it/s][A
|
|
|
|
| 1574 |
60%|βββββββββββββββββββββββββββββββββββββ | 60/100 [00:31<00:21, 1.90it/s][A
|
|
|
|
| 1575 |
61%|ββββββββββββββββββββββββββββββββββββββ | 61/100 [00:32<00:20, 1.86it/s][A
|
|
|
|
| 1576 |
62%|ββββββββββββββββββββββββββββββββββββββ | 62/100 [00:32<00:20, 1.88it/s][A
|
|
|
|
| 1577 |
63%|βββββββββββββββββββββββββββββββββββββββ | 63/100 [00:33<00:19, 1.89it/s][A
|
|
|
|
| 1578 |
64%|βββββββββββββββββββββββββββββββββββββββ | 64/100 [00:33<00:18, 1.90it/s][A
|
|
|
|
| 1579 |
65%|ββββββββββββββββββββββββββββββββββββββββ | 65/100 [00:34<00:18, 1.86it/s][A
|
|
|
|
| 1580 |
66%|βββββββββββββββββββββββββββββββββββββββββ | 66/100 [00:34<00:18, 1.88it/s][A
|
|
|
|
| 1581 |
67%|βββββββββββββββββββββββββββββββββββββββββ | 67/100 [00:35<00:17, 1.89it/s][A
|
|
|
|
| 1582 |
68%|ββββββββββββββββββββββββββββββββββββββββββ | 68/100 [00:35<00:16, 1.90it/s][A
|
|
|
|
| 1583 |
69%|ββββββββββββββββββββββββββββββββββββββββββ | 69/100 [00:36<00:16, 1.86it/s][A
|
|
|
|
| 1584 |
70%|βββββββββββββββββββββββββββββββββββββββββββ | 70/100 [00:36<00:15, 1.88it/s][A
|
|
|
|
| 1585 |
71%|ββββββββββββββββββββββββββββββββββββββββββββ | 71/100 [00:37<00:15, 1.89it/s][A
|
|
|
|
| 1586 |
72%|ββββββββββββββββββββββββββββββββββββββββββββ | 72/100 [00:37<00:14, 1.90it/s][A
|
|
|
|
| 1587 |
73%|βββββββββββββββββββββββββββββββββββββββββββββ | 73/100 [00:38<00:14, 1.86it/s][A
|
|
|
|
| 1588 |
74%|ββββββββββββββββββββββββββββββββββββββββββββββ | 74/100 [00:39<00:13, 1.88it/s][A
|
|
|
|
| 1589 |
75%|ββββββββββββββββββββββββββββββββββββββββββββββ | 75/100 [00:39<00:13, 1.89it/s][A
|
|
|
|
| 1590 |
76%|βββββββββββββββββββββββββββββββββββββββββββββββ | 76/100 [00:40<00:12, 1.90it/s][A
|
|
|
|
| 1591 |
77%|βββββββββββββββββββββββββββββββββββββββββββββββ | 77/100 [00:40<00:12, 1.86it/s][A
|
|
|
|
| 1592 |
78%|ββββββββββββββββββββββββββββββββββββββββββββββββ | 78/100 [00:41<00:11, 1.88it/s][A
|
|
|
|
| 1593 |
79%|ββββββββββββββββββββββββββββββββββββββββββββββοΏ½οΏ½ββ | 79/100 [00:41<00:11, 1.89it/s][A
|
|
|
|
| 1594 |
80%|βββββββββββββββββββββββββββββββββββββββββββββββββ | 80/100 [00:42<00:10, 1.90it/s][A
|
|
|
|
| 1595 |
81%|ββββββββββββββββββββββββββββββββββββββββββββββββββ | 81/100 [00:42<00:10, 1.86it/s][A
|
|
|
|
| 1596 |
82%|ββββββββββββββββββββββββββββββββββββββββββββββββββ | 82/100 [00:43<00:09, 1.88it/s][A
|
|
|
|
| 1597 |
83%|βββββββββββββββββββββββββββββββββββββββββββββββββββ | 83/100 [00:43<00:08, 1.89it/s][A
|
|
|
|
| 1598 |
84%|ββββββββββββββββββββββββββββββββββββββββββββββββββββ | 84/100 [00:44<00:08, 1.90it/s][A
|
|
|
|
| 1599 |
85%|ββββββββββββββββββββββββββββββββββββββββββββββββββββ | 85/100 [00:44<00:08, 1.86it/s][A
|
|
|
|
| 1600 |
86%|βββββββββββββββββββββββββββββββββββββββββββββββββββββ | 86/100 [00:45<00:07, 1.88it/s][A
|
|
|
|
| 1601 |
87%|βββββββββββββββββββββββββββββββββββββββββββββββββββββ | 87/100 [00:45<00:06, 1.89it/s][A
|
|
|
|
| 1602 |
88%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 88/100 [00:46<00:06, 1.90it/s][A
|
|
|
|
| 1603 |
89%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 89/100 [00:47<00:05, 1.86it/s][A
|
|
|
|
| 1604 |
90%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 90/100 [00:47<00:05, 1.88it/s][A
|
|
|
|
| 1605 |
91%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 91/100 [00:48<00:04, 1.89it/s][A
|
|
|
|
| 1606 |
92%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 92/100 [00:48<00:04, 1.90it/s][A
|
|
|
|
| 1607 |
93%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 93/100 [00:49<00:03, 1.86it/s][A
|
|
|
|
| 1608 |
94%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 94/100 [00:49<00:03, 1.88it/s][A
|
|
|
|
| 1609 |
95%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 95/100 [00:50<00:02, 1.89it/s][A
|
|
|
|
| 1610 |
96%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 96/100 [00:50<00:02, 1.90it/s][A
|
|
|
|
| 1611 |
97%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 97/100 [00:51<00:01, 1.86it/s][A
|
|
|
|
| 1612 |
98%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 98/100 [00:51<00:01, 1.88it/s][A
|
|
|
|
| 1613 |
99%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ| 99/100 [00:52<00:00, 1.89it/s][A
|
|
|
|
| 1614 |
|
|
|
|
| 1615 |
|
|
|
|
| 1616 |
77%|ββββββοΏ½οΏ½οΏ½ββββββββββββββββββββββββββββββββββββββ | 500/650 [1:18:37<20:39, 8.27s/it]
|
|
|
|
|
|
|
| 1617 |
[A[2026-01-24 14:44:10,048] [INFO] [axolotl.core.trainers.base._save:721] [PID:9359] Saving model checkpoint to ./phi4_african_history_lora_out/checkpoint-500
|
|
|
|
| 1267 |
|
| 1268 |
62%|ββββββββββββββββββββββββββββββββββββ | 400/650 [1:03:04<34:25, 8.26s/it]
|
| 1269 |
|
| 1270 |
|
| 1271 |
[A[2026-01-24 14:28:37,265] [INFO] [axolotl.core.trainers.base._save:721] [PID:9359] Saving model checkpoint to ./phi4_african_history_lora_out/checkpoint-400
|
| 1272 |
+
|
| 1273 |
62%|βββββββββββββββββββββββββββββββββββ | 401/650 [1:03:13<1:42:25, 24.68s/it]
|
| 1274 |
62%|βββββββββββββββββββββββββββββββββββ | 402/650 [1:03:21<1:21:38, 19.75s/it]
|
| 1275 |
62%|βββββββββββββββββββββββββββββββββββ | 403/650 [1:03:27<1:04:39, 15.71s/it]
|
| 1276 |
62%|ββββββββββββββββββββββββββββββββββββ | 404/650 [1:03:37<57:40, 14.07s/it]
|
| 1277 |
62%|βββββββββββββββββββββββββββββββββββββ | 405/650 [1:03:46<50:18, 12.32s/it]
|
| 1278 |
|
| 1279 |
+
|
| 1280 |
62%|βββββββββββββββββββββββββββββββββββββ | 405/650 [1:03:46<50:18, 12.32s/it]
|
| 1281 |
62%|βββββββββββββββββββββββββββββββββββββ | 406/650 [1:03:54<45:09, 11.10s/it]
|
| 1282 |
63%|βββββββββββββββββββββββββββββββββββββ | 407/650 [1:04:02<41:30, 10.25s/it]
|
| 1283 |
63%|βββββββββββββββββββββββββββββββββββββ | 408/650 [1:04:11<38:54, 9.65s/it]
|
| 1284 |
63%|βββββββββββββββββββββββββββββββββββββ | 409/650 [1:04:19<37:04, 9.23s/it]
|
| 1285 |
63%|βββββββββββββββββββββββββββββββββββββ | 410/650 [1:04:27<35:44, 8.93s/it]
|
| 1286 |
|
| 1287 |
+
|
| 1288 |
63%|βββββββββββββββββββββββββββββββββββββ | 410/650 [1:04:27<35:44, 8.93s/it]
|
| 1289 |
63%|βββββββββββββββββββββββββββββββββββββ | 411/650 [1:04:35<34:45, 8.73s/it]
|
| 1290 |
63%|βββββββββββββββββββββββββββββββββββββ | 412/650 [1:04:43<34:02, 8.58s/it]
|
| 1291 |
64%|βββββββββββββββββββββββββββββββββββββ | 413/650 [1:04:52<33:30, 8.48s/it]
|
| 1292 |
64%|βββββββββββββββββββββββββββββββββββββ | 414/650 [1:05:00<33:05, 8.41s/it]
|
| 1293 |
64%|βββββββββββββββββββββββββββββββββββββ | 415/650 [1:05:08<32:45, 8.36s/it]
|
| 1294 |
|
| 1295 |
+
|
| 1296 |
64%|ββββββββββββββββββββββββββββοΏ½οΏ½ββββββββ | 415/650 [1:05:08<32:45, 8.36s/it]
|
| 1297 |
64%|βββββββββββββββββββββββββββββββββββββ | 416/650 [1:05:14<30:08, 7.73s/it]
|
| 1298 |
64%|ββββββββββββββββββββββββββββββββββββββ | 417/650 [1:05:25<32:47, 8.45s/it]
|
| 1299 |
64%|ββββββββββββββββββββββββββββββββββββββ | 418/650 [1:05:33<32:25, 8.38s/it]
|
| 1300 |
64%|ββββββββββββββββββββββββββββββββββββββ | 419/650 [1:05:41<32:06, 8.34s/it]
|
| 1301 |
65%|ββββββββββββββββββββββββββββββββββββββ | 420/650 [1:05:49<31:51, 8.31s/it]
|
| 1302 |
|
| 1303 |
+
|
| 1304 |
65%|ββββββββββββββββββββββββββββββββββββββ | 420/650 [1:05:49<31:51, 8.31s/it]
|
| 1305 |
65%|ββββββββββββββββββββββββββββββββββββββ | 421/650 [1:05:58<31:39, 8.30s/it]
|
| 1306 |
65%|ββββββββββββββββββββββββββββββββββββββ | 422/650 [1:06:06<31:28, 8.28s/it]
|
| 1307 |
65%|ββββββββββββββββββββββββββββββββββββββ | 423/650 [1:06:14<31:18, 8.27s/it]
|
| 1308 |
65%|ββββββββββββββββββββββββββββββββββββββ | 424/650 [1:06:22<31:08, 8.27s/it]
|
| 1309 |
65%|ββββββββββββββββββββββββββββββββββββββ | 425/650 [1:06:31<30:58, 8.26s/it]
|
| 1310 |
|
| 1311 |
+
|
| 1312 |
65%|ββββββββββββββββββββββββββββββββββββββ | 425/650 [1:06:31<30:58, 8.26s/it]
|
| 1313 |
66%|ββββββββββββββββββββββββββββββββββββββ | 426/650 [1:06:39<30:49, 8.26s/it]
|
| 1314 |
66%|ββββββββββββββββββββββββββββββββββββββ | 427/650 [1:06:47<30:41, 8.26s/it]
|
| 1315 |
66%|βββββββββββββββββββββββββββββββββββββββ | 428/650 [1:06:55<30:32, 8.25s/it]
|
| 1316 |
66%|βββββββββββββββββββββββββββββββββββββββ | 429/650 [1:07:02<28:10, 7.65s/it]
|
| 1317 |
66%|βββββββββββββββββββββββββββββββββββββββ | 430/650 [1:07:12<30:46, 8.40s/it]
|
| 1318 |
|
| 1319 |
+
|
| 1320 |
66%|βββββββββββββββββββββββββββββββββββββββ | 430/650 [1:07:12<30:46, 8.40s/it]
|
| 1321 |
66%|βββββββββββββββββββββββββββββββββββββββ | 431/650 [1:07:20<30:29, 8.35s/it]
|
| 1322 |
66%|βββββββββββββββββββββββββββββββββββββββ | 432/650 [1:07:28<30:14, 8.32s/it]
|
| 1323 |
67%|βββββββββββββββββββββββββββββββββββββββ | 433/650 [1:07:36<30:01, 8.30s/it]
|
| 1324 |
67%|ββοΏ½οΏ½ββββββββββββββββββββββββββββββββββββ | 434/650 [1:07:45<29:49, 8.29s/it]
|
| 1325 |
67%|βββββββββββββββββββββββββββββββββββββββ | 435/650 [1:07:53<29:38, 8.27s/it]
|
| 1326 |
|
| 1327 |
+
|
| 1328 |
67%|βββββββββββββββββββββββββββββββββββββββ | 435/650 [1:07:53<29:38, 8.27s/it]
|
| 1329 |
67%|βββββββββββββββββββββββββββββββββββββββ | 436/650 [1:08:01<29:29, 8.27s/it]
|
| 1330 |
67%|βββββββββββββββββββββββββββββββββββββββ | 437/650 [1:08:09<29:19, 8.26s/it]
|
| 1331 |
67%|βββββββββββββββββββββββββββββββββββββββ | 438/650 [1:08:18<29:11, 8.26s/it]
|
| 1332 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 439/650 [1:08:26<29:02, 8.26s/it]
|
| 1333 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 440/650 [1:08:34<28:54, 8.26s/it]
|
| 1334 |
|
| 1335 |
+
|
| 1336 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 440/650 [1:08:34<28:54, 8.26s/it]
|
| 1337 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 441/650 [1:08:43<28:46, 8.26s/it]
|
| 1338 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 442/650 [1:08:49<26:33, 7.66s/it]
|
| 1339 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 443/650 [1:08:59<28:59, 8.40s/it]
|
| 1340 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 444/650 [1:09:07<28:41, 8.36s/it]
|
| 1341 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 445/650 [1:09:15<28:26, 8.33s/it]
|
| 1342 |
|
| 1343 |
+
|
| 1344 |
68%|ββββββββββββββββββββββββββββββββββββββββ | 445/650 [1:09:15<28:26, 8.33s/it]
|
| 1345 |
69%|ββββββββββββββββββββββββββββββββββββββββ | 446/650 [1:09:24<28:13, 8.30s/it]
|
| 1346 |
69%|ββββββββββββββββββββββββββββββββββββββββ | 447/650 [1:09:32<28:02, 8.29s/it]
|
| 1347 |
69%|ββββββββββββββββββββββββββββββββββββββββ | 448/650 [1:09:40<27:51, 8.28s/it]
|
| 1348 |
69%|ββββββββββββββββββββββββββββββββββββββββ | 449/650 [1:09:48<27:41, 8.27s/it]
|
| 1349 |
69%|βββββββββββββββββββββββββββββββββββββββββ | 450/650 [1:09:57<27:32, 8.26s/it]
|
| 1350 |
|
| 1351 |
+
|
| 1352 |
69%|βββββββββββββββββββββββββββββββββββββββββ | 450/650 [1:09:57<27:32, 8.26s/it][2026-01-24 14:35:30,194] [INFO] [axolotl.core.trainers.base.evaluate:400] [PID:9359] Running evaluation step...
|
| 1353 |
+
|
| 1354 |
+
|
| 1355 |
0%| | 0/100 [00:00<?, ?it/s][A
|
| 1356 |
+
|
| 1357 |
2%|ββ | 2/100 [00:00<00:25, 3.85it/s][A
|
| 1358 |
+
|
| 1359 |
3%|ββ | 3/100 [00:01<00:35, 2.71it/s][A
|
| 1360 |
+
|
| 1361 |
4%|βββ | 4/100 [00:01<00:40, 2.35it/s][A
|
| 1362 |
+
|
| 1363 |
5%|βββ | 5/100 [00:02<00:56, 1.69it/s][A
|
| 1364 |
+
|
| 1365 |
6%|ββββ | 6/100 [00:02<00:53, 1.76it/s][A
|
| 1366 |
+
|
| 1367 |
7%|βββββ | 7/100 [00:03<00:51, 1.81it/s][A
|
| 1368 |
+
|
| 1369 |
8%|βββββ | 8/100 [00:04<00:50, 1.84it/s][A
|
| 1370 |
+
|
| 1371 |
9%|ββββββ | 9/100 [00:04<00:50, 1.82it/s][A
|
| 1372 |
+
|
| 1373 |
10%|ββββββ | 10/100 [00:05<00:48, 1.85it/s][A
|
| 1374 |
+
|
| 1375 |
11%|βββββββ | 11/100 [00:05<00:47, 1.87it/s][A
|
| 1376 |
+
|
| 1377 |
12%|ββββββββ | 12/100 [00:06<00:46, 1.89it/s][A
|
| 1378 |
+
|
| 1379 |
13%|ββββββββ | 13/100 [00:06<00:46, 1.85it/s][A
|
| 1380 |
+
|
| 1381 |
14%|βββββββββ | 14/100 [00:07<00:45, 1.87it/s][A
|
| 1382 |
+
|
| 1383 |
15%|ββββββββββ | 15/100 [00:07<00:45, 1.89it/s][A
|
| 1384 |
+
|
| 1385 |
16%|ββββββββββ | 16/100 [00:08<00:44, 1.90it/s][A
|
| 1386 |
+
|
| 1387 |
17%|βββββββββββ | 17/100 [00:08<00:44, 1.86it/s][A
|
| 1388 |
+
|
| 1389 |
18%|βββββββββββ | 18/100 [00:09<00:43, 1.88it/s][A
|
| 1390 |
+
|
| 1391 |
19%|ββββββββββββ | 19/100 [00:09<00:42, 1.89it/s][A
|
| 1392 |
+
|
| 1393 |
20%|βββββββββββββ | 20/100 [00:10<00:42, 1.90it/s][A
|
| 1394 |
+
|
| 1395 |
21%|βββββββββββββ | 21/100 [00:10<00:42, 1.86it/s][A
|
| 1396 |
+
|
| 1397 |
22%|ββββββββββββββ | 22/100 [00:11<00:41, 1.88it/s][A
|
| 1398 |
+
|
| 1399 |
23%|ββββββββββββββ | 23/100 [00:12<00:40, 1.89it/s][A
|
| 1400 |
+
|
| 1401 |
24%|βββββββββββββββ | 24/100 [00:12<00:40, 1.90it/s][A
|
| 1402 |
+
|
| 1403 |
25%|ββββββββββββββββ | 25/100 [00:13<00:40, 1.86it/s][A
|
| 1404 |
+
|
| 1405 |
26%|ββββββββββββββββ | 26/100 [00:13<00:39, 1.88it/s][A
|
| 1406 |
+
|
| 1407 |
27%|βββββββββββββββββ | 27/100 [00:14<00:38, 1.89it/s][A
|
| 1408 |
+
|
| 1409 |
28%|βββββββββββββββββ | 28/100 [00:14<00:37, 1.90it/s][A
|
| 1410 |
+
|
| 1411 |
29%|ββββββββββββββββββ | 29/100 [00:15<00:38, 1.86it/s][A
|
| 1412 |
+
|
| 1413 |
30%|βββββββββββββββββββ | 30/100 [00:15<00:37, 1.88it/s][A
|
| 1414 |
+
|
| 1415 |
31%|βββββββββββββββββββ | 31/100 [00:16<00:36, 1.89it/s][A
|
| 1416 |
+
|
| 1417 |
32%|ββββββββββββββββββββ | 32/100 [00:16<00:35, 1.90it/s][A
|
| 1418 |
+
|
| 1419 |
33%|βββββββββββββββββββββ | 33/100 [00:17<00:36, 1.86it/s][A
|
| 1420 |
+
|
| 1421 |
34%|βββββββββββββββββββββ | 34/100 [00:17<00:35, 1.88it/s][A
|
| 1422 |
+
|
| 1423 |
35%|ββββββββββββββββββββββ | 35/100 [00:18<00:34, 1.89it/s][A
|
| 1424 |
+
|
| 1425 |
36%|ββββββββββββββββββββββ | 36/100 [00:18<00:33, 1.90it/s][A
|
| 1426 |
+
|
| 1427 |
37%|βββββββββββββββββββββββ | 37/100 [00:19<00:35, 1.79it/s][A
|
| 1428 |
+
|
| 1429 |
38%|ββββββββββββββββββββββββ | 38/100 [00:19<00:32, 1.90it/s][A
|
| 1430 |
+
|
| 1431 |
39%|ββββββββββββββββββββββββ | 39/100 [00:20<00:31, 1.91it/s][A
|
| 1432 |
+
|
| 1433 |
40%|βββββββββββββββββββββββββ | 40/100 [00:21<00:31, 1.91it/s][A
|
| 1434 |
+
|
| 1435 |
41%|βββββββββββββββββββββββββ | 41/100 [00:21<00:31, 1.87it/s][A
|
| 1436 |
+
|
| 1437 |
42%|ββββββββββββββββββββββββββ | 42/100 [00:22<00:30, 1.89it/s][A
|
| 1438 |
+
|
| 1439 |
43%|βββββββββββββββββββββββββββ | 43/100 [00:22<00:30, 1.89it/s][A
|
| 1440 |
+
|
| 1441 |
44%|βββββββββββββββββββββββββββ | 44/100 [00:23<00:29, 1.90it/s][A
|
| 1442 |
+
|
| 1443 |
45%|ββββββββββββββββββββββββββββ | 45/100 [00:23<00:29, 1.86it/s][A
|
| 1444 |
+
|
| 1445 |
46%|ββββββββββββββββββββββββββββ | 46/100 [00:24<00:28, 1.88it/s][A
|
| 1446 |
+
|
| 1447 |
47%|βββββββββββββββββββββββββββββ | 47/100 [00:24<00:28, 1.89it/s][A
|
| 1448 |
+
|
| 1449 |
48%|ββββββββββββββββββββββββββββββ | 48/100 [00:25<00:27, 1.90it/s][A
|
| 1450 |
+
|
| 1451 |
49%|ββββββββββββββββββββββββββββββ | 49/100 [00:25<00:27, 1.86it/s][A
|
| 1452 |
+
|
| 1453 |
50%|βββββββββββββββββββββββββββββββ | 50/100 [00:26<00:26, 1.88it/s][A
|
| 1454 |
+
|
| 1455 |
51%|βββββββββββββββββββββββββββββββ | 51/100 [00:26<00:25, 1.89it/s][A
|
| 1456 |
+
|
| 1457 |
52%|ββββββββββββββββββββββββββββββββ | 52/100 [00:27<00:25, 1.90it/s][A
|
| 1458 |
+
|
| 1459 |
53%|βββββββββββββββββββββββββββββββββ | 53/100 [00:27<00:25, 1.86it/s][A
|
| 1460 |
+
|
| 1461 |
54%|βββββββββββββββββββββββββββββββββ | 54/100 [00:28<00:24, 1.88it/s][A
|
| 1462 |
+
|
| 1463 |
55%|ββββββββββββββββββββββββββββββββββ | 55/100 [00:29<00:23, 1.89it/s][A
|
| 1464 |
+
|
| 1465 |
56%|βββββββββββββββββββββββββββββββββββ | 56/100 [00:29<00:23, 1.90it/s][A
|
| 1466 |
+
|
| 1467 |
57%|βββββββββββββββββββββββββββββββββββ | 57/100 [00:30<00:23, 1.86it/s][A
|
| 1468 |
+
|
| 1469 |
58%|ββββββββββββββββββββββββββββββββββββ | 58/100 [00:30<00:22, 1.88it/s][A
|
| 1470 |
+
|
| 1471 |
59%|ββββββββββββββββββββββββββββββββββββ | 59/100 [00:31<00:21, 1.89it/s][A
|
| 1472 |
+
|
| 1473 |
60%|βββββββββββββββββββββββββββββββββββββ | 60/100 [00:31<00:21, 1.90it/s][A
|
| 1474 |
+
|
| 1475 |
61%|ββββββββββββββββββββββββββββββββββββββ | 61/100 [00:32<00:20, 1.86it/s][A
|
| 1476 |
+
|
| 1477 |
62%|ββββββββββββββββββββββββββββββββββββββ | 62/100 [00:32<00:20, 1.88it/s][A
|
| 1478 |
+
|
| 1479 |
63%|βββββββββββββββββββββββββββββββββββββββ | 63/100 [00:33<00:19, 1.89it/s][A
|
| 1480 |
+
|
| 1481 |
64%|βββββββββββββββββββββββββββββββββββββββ | 64/100 [00:33<00:18, 1.90it/s][A
|
| 1482 |
+
|
| 1483 |
65%|ββββββββββββββββββββββββββββββββββββββββ | 65/100 [00:34<00:18, 1.86it/s][A
|
| 1484 |
+
|
| 1485 |
66%|βββββββββββββββββββββββββββββββββββββββββ | 66/100 [00:34<00:18, 1.88it/s][A
|
| 1486 |
+
|
| 1487 |
67%|βββββββββββββοΏ½οΏ½οΏ½βββββββββββββββββββββββββββ | 67/100 [00:35<00:17, 1.89it/s][A
|
| 1488 |
+
|
| 1489 |
68%|ββββββββββββββββββββββββββββββββββββββββββ | 68/100 [00:35<00:16, 1.90it/s][A
|
| 1490 |
+
|
| 1491 |
69%|ββββββββββββββββββββββββββββββββββββββββββ | 69/100 [00:36<00:16, 1.86it/s][A
|
| 1492 |
+
|
| 1493 |
70%|βββββββββββββββββββββββββββββββββββββββββββ | 70/100 [00:36<00:15, 1.88it/s][A
|
| 1494 |
+
|
| 1495 |
71%|ββββββββββββββββββββββββββββββββββββββββββββ | 71/100 [00:37<00:15, 1.89it/s][A
|
| 1496 |
+
|
| 1497 |
72%|ββββββββββββββββββββββββββββββββββββββββββββ | 72/100 [00:38<00:14, 1.90it/s][A
|
| 1498 |
+
|
| 1499 |
73%|βββββββββββββββββββββββββββββββββββββββββββββ | 73/100 [00:38<00:14, 1.86it/s][A
|
| 1500 |
+
|
| 1501 |
74%|ββββββββββββββββββββββββββββββββββββββββββββββ | 74/100 [00:39<00:13, 1.88it/s][A
|
| 1502 |
+
|
| 1503 |
75%|ββββββββββββββββββββββββββββββββββββββββββββββ | 75/100 [00:39<00:13, 1.89it/s][A
|
| 1504 |
+
|
| 1505 |
76%|βββββββββββββββββββββββββββββββββββββββββββββββ | 76/100 [00:40<00:12, 1.90it/s][A
|
| 1506 |
+
|
| 1507 |
77%|βββββββββββββββββββββββββββββββββββββββββββββββ | 77/100 [00:40<00:12, 1.86it/s][A
|
| 1508 |
+
|
| 1509 |
78%|ββββββββββββββββββββββββββββββββββββββββββββββββ | 78/100 [00:41<00:11, 1.88it/s][A
|
| 1510 |
+
|
| 1511 |
79%|βββββββββββββββββββββββββββββββββββββββββββββββββ | 79/100 [00:41<00:11, 1.89it/s][A
|
| 1512 |
+
|
| 1513 |
80%|βββββββββββββββββββββββββββββββββββββββββββββββββ | 80/100 [00:42<00:10, 1.90it/s][A
|
| 1514 |
+
|
| 1515 |
81%|ββββββββββββββββββββββββββββββββββββββββββββββββββ | 81/100 [00:42<00:10, 1.86it/s][A
|
| 1516 |
+
|
| 1517 |
82%|ββββββββββββββββββββββββββββββββββββββββββββββββββ | 82/100 [00:43<00:09, 1.88it/s][A
|
| 1518 |
+
|
| 1519 |
83%|βββββββββββββββββββββββββββββββββββββββββββββββββββ | 83/100 [00:43<00:08, 1.89it/s][A
|
| 1520 |
+
|
| 1521 |
84%|ββββββββββββββββββββββββββββββββββββββββββββββββββββ | 84/100 [00:44<00:08, 1.90it/s][A
|
| 1522 |
+
|
| 1523 |
85%|ββββββββββββββββββββββββββββββββββββββββββββββββββββ | 85/100 [00:44<00:08, 1.86it/s][A
|
| 1524 |
+
|
| 1525 |
86%|βββββββββββββββββββββββββββββββββββββββββββββββββββββ | 86/100 [00:45<00:07, 1.88it/s][A
|
| 1526 |
+
|
| 1527 |
87%|βββββββββββββββββββββββββββββββββββββββββββββββββββββ | 87/100 [00:46<00:06, 1.89it/s][A
|
| 1528 |
+
|
| 1529 |
88%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 88/100 [00:46<00:06, 1.90it/s][A
|
| 1530 |
+
|
| 1531 |
89%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 89/100 [00:47<00:05, 1.86it/s][A
|
| 1532 |
+
|
| 1533 |
90%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 90/100 [00:47<00:05, 1.88it/s][A
|
| 1534 |
+
|
| 1535 |
91%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 91/100 [00:48<00:04, 1.89it/s][A
|
| 1536 |
+
|
| 1537 |
92%|βββββββββββββββββββββββββββββββββββοΏ½οΏ½ββββββββββββββββββββ | 92/100 [00:48<00:04, 1.90it/s][A
|
| 1538 |
+
|
| 1539 |
93%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 93/100 [00:49<00:03, 1.86it/s][A
|
| 1540 |
+
|
| 1541 |
94%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 94/100 [00:49<00:03, 1.88it/s][A
|
| 1542 |
+
|
| 1543 |
95%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 95/100 [00:50<00:02, 1.89it/s][A
|
| 1544 |
+
|
| 1545 |
96%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 96/100 [00:50<00:02, 1.90it/s][A
|
| 1546 |
+
|
| 1547 |
97%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 97/100 [00:51<00:01, 1.86it/s][A
|
| 1548 |
+
|
| 1549 |
98%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 98/100 [00:51<00:01, 1.88it/s][A
|
| 1550 |
+
|
| 1551 |
99%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ| 99/100 [00:52<00:00, 1.89it/s][A
|
| 1552 |
+
|
| 1553 |
|
| 1554 |
+
|
| 1555 |
|
| 1556 |
+
|
| 1557 |
69%|βββββββββββββββββββββββββββββββββββββββββ | 450/650 [1:10:51<27:32, 8.26s/it]
|
| 1558 |
+
|
| 1559 |
+
|
| 1560 |
[A
|
| 1561 |
69%|βββββββββββββββββββββββββββββββββββββββ | 451/650 [1:10:59<1:21:14, 24.49s/it]
|
| 1562 |
70%|βββββββββββββββββββββββββββββββββββββββ | 452/650 [1:11:07<1:04:45, 19.62s/it]
|
| 1563 |
70%|βββββββββββββββββββββββββββββββββββββββββ | 453/650 [1:11:16<53:13, 16.21s/it]
|
| 1564 |
70%|βββββββββββββββββββββββββββββββββββββββββ | 454/650 [1:11:24<45:08, 13.82s/it]
|
| 1565 |
70%|βββββββββββββββββββββββββββββββββββββββββ | 455/650 [1:11:30<37:31, 11.55s/it]
|
| 1566 |
|
| 1567 |
+
|
| 1568 |
70%|βββββββββββββββββββββββββββββββββββββββββ | 455/650 [1:11:30<37:31, 11.55s/it]
|
| 1569 |
70%|βββββββββββββββββββββββββββββββββββββββββ | 456/650 [1:11:40<35:56, 11.11s/it]
|
| 1570 |
70%|βββββββββββββββββββββββββββββββββββββββββ | 457/650 [1:11:48<32:59, 10.26s/it]
|
| 1571 |
70%|βββββββββββββββββββββββββββββββββββββββββ | 458/650 [1:11:57<30:53, 9.65s/it]
|
| 1572 |
71%|βββββββββββββββββββββββββββββββββββββββββ | 459/650 [1:12:05<29:23, 9.23s/it]
|
| 1573 |
71%|βββββββββββββββββββββββββββββββββββββββββ | 460/650 [1:12:13<28:17, 8.94s/it]
|
| 1574 |
|
| 1575 |
+
|
| 1576 |
71%|βββββββββββββββββββββββββββββββββββββββββ | 460/650 [1:12:13<28:17, 8.94s/it]
|
| 1577 |
71%|ββββββββββββββββββββββββββββββββββββββββββ | 461/650 [1:12:21<27:29, 8.73s/it]
|
| 1578 |
71%|ββββββββββββββββββββββββββββββββββββββββββ | 462/650 [1:12:30<26:54, 8.59s/it]
|
| 1579 |
71%|ββββββββββββββββββββββββββββββββββββββββββ | 463/650 [1:12:38<26:26, 8.48s/it]
|
| 1580 |
71%|ββββββββββββββββββββββββββββββββββββββββββ | 464/650 [1:12:46<26:04, 8.41s/it]
|
| 1581 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 465/650 [1:12:54<25:46, 8.36s/it]
|
| 1582 |
|
| 1583 |
+
|
| 1584 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 465/650 [1:12:54<25:46, 8.36s/it]
|
| 1585 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 466/650 [1:13:03<25:31, 8.32s/it]
|
| 1586 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 467/650 [1:13:11<25:18, 8.30s/it]
|
| 1587 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 468/650 [1:13:17<23:18, 7.68s/it]
|
| 1588 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 469/650 [1:13:27<25:25, 8.43s/it]
|
| 1589 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 470/650 [1:13:35<25:07, 8.37s/it]
|
| 1590 |
|
| 1591 |
+
|
| 1592 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 470/650 [1:13:35<25:07, 8.37s/it]
|
| 1593 |
72%|ββββββββββββββββββββββββββββββββββββββββββ | 471/650 [1:13:44<24:51, 8.33s/it]
|
| 1594 |
73%|ββββββββββββββββββββββββββββββββββββββββββ | 472/650 [1:13:52<24:38, 8.30s/it]
|
| 1595 |
73%|βββββββββββββββββββββββββββββββββββββββββββ | 473/650 [1:14:00<24:27, 8.29s/it]
|
| 1596 |
73%|βββββββββββββββββββββββββββββββββββββββββββ | 474/650 [1:14:08<24:16, 8.27s/it]
|
| 1597 |
73%|βββββββββββββββββββββββββββββββββββββββββββ | 475/650 [1:14:17<24:07, 8.27s/it]
|
| 1598 |
|
| 1599 |
+
|
| 1600 |
73%|βββββββββββββββββββββββββββββββββββββββββββ | 475/650 [1:14:17<24:07, 8.27s/it]
|
| 1601 |
73%|βββββββββββββββββββββββββββββββββββββββββββ | 476/650 [1:14:25<23:57, 8.26s/it]
|
| 1602 |
73%|βββββββββββββββββββββββββββββββββββββββββββ | 477/650 [1:14:33<23:48, 8.26s/it]
|
| 1603 |
74%|βββββββββββββββββββββββββββββββββββββββββββ | 478/650 [1:14:41<23:39, 8.25s/it]
|
| 1604 |
74%|βββββββββββββββββββββββββββββββββββββββββββ | 479/650 [1:14:50<23:30, 8.25s/it]
|
| 1605 |
74%|βββββββββββββββββββββββββββββββββββββββββββ | 480/650 [1:14:58<23:21, 8.24s/it]
|
| 1606 |
|
| 1607 |
+
|
| 1608 |
74%|βββββββββββββββββββββββββββββββββββββββββββ | 480/650 [1:14:58<23:21, 8.24s/it]
|
| 1609 |
74%|βββββββββββββββββββββββββββββββββββββββββββ | 481/650 [1:15:04<21:31, 7.64s/it]
|
| 1610 |
74%|βββββββββββββββββββββββββββββββββββββββββββ | 482/650 [1:15:14<23:28, 8.38s/it]
|
| 1611 |
74%|βββββββββββββββββββββββββββββββββββββββββββ | 483/650 [1:15:23<23:13, 8.34s/it]
|
| 1612 |
74%|ββββββββββββββββββββββββββββββββββββββββββββ | 484/650 [1:15:31<22:59, 8.31s/it]
|
| 1613 |
75%|ββββββββββββββββββββββββββββββββββββββββββββ | 485/650 [1:15:39<22:47, 8.29s/it]
|
| 1614 |
|
| 1615 |
+
|
| 1616 |
75%|ββββββββββββββββββββββββββββββββββββββββββββ | 485/650 [1:15:39<22:47, 8.29s/it]
|
| 1617 |
75%|ββββββββββββββββββββββββββββββββββββββββββββ | 486/650 [1:15:47<22:37, 8.28s/it]
|
| 1618 |
75%|ββββββββββββββββββββββββββββββββββββββββββββ | 487/650 [1:15:55<22:27, 8.27s/it]
|
| 1619 |
75%|ββββββββββββββββββββββββββββββββββββββββββββ | 488/650 [1:16:04<22:17, 8.26s/it]
|
| 1620 |
75%|ββββββββββββββββββββββββββββββββββββββββββββ | 489/650 [1:16:12<22:09, 8.25s/it]
|
| 1621 |
75%|ββββββββββββββββββββββββββββββββββββββββββββ | 490/650 [1:16:20<22:00, 8.25s/it]
|
| 1622 |
|
| 1623 |
+
|
| 1624 |
75%|ββββββββββββββββββββββββββββββββββββββββββββ | 490/650 [1:16:20<22:00, 8.25s/it]
|
| 1625 |
76%|ββββββββββββββββββοΏ½οΏ½οΏ½βββββββββββββββββββββββββ | 491/650 [1:16:28<21:51, 8.25s/it]
|
| 1626 |
76%|ββββββββββββββββββββββββββββββββββββββββββββ | 492/650 [1:16:37<21:42, 8.24s/it]
|
| 1627 |
76%|ββββββββββββββββββββββββββββββββββββββββββββ | 493/650 [1:16:45<21:34, 8.25s/it]
|
| 1628 |
76%|ββββββββββββββββββββββββββββββββββββββββββββ | 494/650 [1:16:51<19:52, 7.65s/it]
|
| 1629 |
76%|βββββββββββββββββββββββββββββββββββββββββββββ | 495/650 [1:17:01<21:41, 8.40s/it]
|
| 1630 |
|
| 1631 |
+
|
| 1632 |
76%|βββββββββββββββββββββββββββββββββββββββββββββ | 495/650 [1:17:01<21:41, 8.40s/it]
|
| 1633 |
76%|βββββββββββββββββββββββββββββββββββββββββββββ | 496/650 [1:17:10<21:26, 8.35s/it]
|
| 1634 |
76%|βββββββββββββββββββββββββββββββββββββββββββββ | 497/650 [1:17:18<21:12, 8.32s/it]
|
| 1635 |
77%|βββββββββββββββββββββββββββββββββββββββββββββ | 498/650 [1:17:26<21:00, 8.29s/it]
|
| 1636 |
77%|βββββββββββββββββββββββββββββββββββββββββββββ | 499/650 [1:17:34<20:49, 8.28s/it]
|
| 1637 |
77%|βββββββββββββββββββββββββββββββββββββββββββββ | 500/650 [1:17:43<20:39, 8.27s/it]
|
| 1638 |
|
| 1639 |
+
|
| 1640 |
77%|βββββββββββββββββββββββββββββββββββββββββββββ | 500/650 [1:17:43<20:39, 8.27s/it][2026-01-24 14:43:16,073] [INFO] [axolotl.core.trainers.base.evaluate:400] [PID:9359] Running evaluation step...
|
| 1641 |
+
|
| 1642 |
+
|
| 1643 |
0%| | 0/100 [00:00<?, ?it/s][A
|
| 1644 |
+
|
| 1645 |
2%|ββ | 2/100 [00:00<00:25, 3.86it/s][A
|
| 1646 |
+
|
| 1647 |
3%|ββ | 3/100 [00:01<00:35, 2.72it/s][A
|
| 1648 |
+
|
| 1649 |
4%|βββ | 4/100 [00:01<00:40, 2.35it/s][A
|
| 1650 |
+
|
| 1651 |
5%|βββ | 5/100 [00:02<00:54, 1.75it/s][A
|
| 1652 |
+
|
| 1653 |
6%|ββββ | 6/100 [00:02<00:52, 1.81it/s][A
|
| 1654 |
+
|
| 1655 |
7%|βββββ | 7/100 [00:03<00:50, 1.84it/s][A
|
| 1656 |
+
|
| 1657 |
8%|βββββ | 8/100 [00:03<00:49, 1.87it/s][A
|
| 1658 |
+
|
| 1659 |
9%|ββββββ | 9/100 [00:04<00:49, 1.84it/s][A
|
| 1660 |
+
|
| 1661 |
10%|ββββββ | 10/100 [00:05<00:48, 1.87it/s][A
|
| 1662 |
+
|
| 1663 |
11%|βββββββ | 11/100 [00:05<00:47, 1.88it/s][A
|
| 1664 |
+
|
| 1665 |
12%|ββββββββ | 12/100 [00:06<00:46, 1.89it/s][A
|
| 1666 |
+
|
| 1667 |
13%|ββββββββ | 13/100 [00:06<00:46, 1.86it/s][A
|
| 1668 |
+
|
| 1669 |
14%|βββββββββ | 14/100 [00:07<00:45, 1.88it/s][A
|
| 1670 |
+
|
| 1671 |
15%|ββββββββββ | 15/100 [00:07<00:44, 1.89it/s][A
|
| 1672 |
+
|
| 1673 |
16%|ββββββββββ | 16/100 [00:08<00:44, 1.90it/s][A
|
| 1674 |
+
|
| 1675 |
17%|βββββββββββ | 17/100 [00:08<00:44, 1.86it/s][A
|
| 1676 |
+
|
| 1677 |
18%|βββββββββββ | 18/100 [00:09<00:43, 1.89it/s][A
|
| 1678 |
+
|
| 1679 |
19%|ββββββββββββ | 19/100 [00:09<00:42, 1.90it/s][A
|
| 1680 |
+
|
| 1681 |
20%|βββββββββββββ | 20/100 [00:10<00:42, 1.90it/s][A
|
| 1682 |
+
|
| 1683 |
21%|βββββββββββββ | 21/100 [00:10<00:42, 1.86it/s][A
|
| 1684 |
+
|
| 1685 |
22%|ββββββββββββββ | 22/100 [00:11<00:41, 1.88it/s][A
|
| 1686 |
+
|
| 1687 |
23%|ββββββββββββββ | 23/100 [00:11<00:40, 1.89it/s][A
|
| 1688 |
+
|
| 1689 |
24%|βββββββββββββββ | 24/100 [00:12<00:39, 1.90it/s][A
|
| 1690 |
+
|
| 1691 |
25%|ββββββββββββββββ | 25/100 [00:13<00:40, 1.86it/s][A
|
| 1692 |
+
|
| 1693 |
26%|ββββββββββββββββ | 26/100 [00:13<00:39, 1.88it/s][A
|
| 1694 |
+
|
| 1695 |
27%|βββββββββββββββββ | 27/100 [00:14<00:38, 1.89it/s][A
|
| 1696 |
+
|
| 1697 |
28%|βββββββββββββββββ | 28/100 [00:14<00:37, 1.90it/s][A
|
| 1698 |
+
|
| 1699 |
29%|ββββββββββββββββββ | 29/100 [00:15<00:38, 1.86it/s][A
|
| 1700 |
+
|
| 1701 |
30%|βββββββββββββββββββ | 30/100 [00:15<00:37, 1.88it/s][A
|
| 1702 |
+
|
| 1703 |
31%|βββββββββββββββββββ | 31/100 [00:16<00:36, 1.89it/s][A
|
| 1704 |
+
|
| 1705 |
32%|ββββββββββββββββββββ | 32/100 [00:16<00:35, 1.90it/s][A
|
| 1706 |
+
|
| 1707 |
33%|βββββββββββββββββββββ | 33/100 [00:17<00:35, 1.86it/s][A
|
| 1708 |
+
|
| 1709 |
34%|βββββββββββββββββββββ | 34/100 [00:17<00:35, 1.88it/s][A
|
| 1710 |
+
|
| 1711 |
35%|ββββββββββββββββββββββ | 35/100 [00:18<00:34, 1.89it/s][A
|
| 1712 |
+
|
| 1713 |
36%|ββββββββββββββββββββββ | 36/100 [00:18<00:33, 1.90it/s][A
|
| 1714 |
+
|
| 1715 |
37%|βββββββββββββββββββββββ | 37/100 [00:19<00:33, 1.86it/s][A
|
| 1716 |
+
|
| 1717 |
38%|ββββββββββββββββββββββββ | 38/100 [00:19<00:32, 1.88it/s][A
|
| 1718 |
+
|
| 1719 |
39%|ββββββββββββββββββββββββ | 39/100 [00:20<00:32, 1.89it/s][A
|
| 1720 |
+
|
| 1721 |
40%|βββββββββββββββββββββββββ | 40/100 [00:20<00:31, 1.90it/s][A
|
| 1722 |
+
|
| 1723 |
41%|βββββββββββββββββββββββββ | 41/100 [00:21<00:31, 1.86it/s][A
|
| 1724 |
+
|
| 1725 |
42%|ββββββββββββββββββββββββββ | 42/100 [00:22<00:30, 1.88it/s][A
|
| 1726 |
+
|
| 1727 |
43%|βββββββββββββββββββββββββββ | 43/100 [00:22<00:30, 1.89it/s][A
|
| 1728 |
+
|
| 1729 |
44%|βββββββββββββββββββββββββββ | 44/100 [00:23<00:29, 1.90it/s][A
|
| 1730 |
+
|
| 1731 |
45%|ββββββββββββββββββββββββββββ | 45/100 [00:23<00:29, 1.86it/s][A
|
| 1732 |
+
|
| 1733 |
46%|ββββββββββββββββββββββββββββ | 46/100 [00:24<00:28, 1.88it/s][A
|
| 1734 |
+
|
| 1735 |
47%|βββββββββββββββββββββββββββββ | 47/100 [00:24<00:28, 1.89it/s][A
|
| 1736 |
+
|
| 1737 |
48%|ββββββββββββββββββββββββββββββ | 48/100 [00:25<00:27, 1.90it/s][A
|
| 1738 |
+
|
| 1739 |
49%|ββββββββββββββββββββββββββββββ | 49/100 [00:25<00:27, 1.86it/s][A
|
| 1740 |
+
|
| 1741 |
50%|βββββββββββββββββββββββββββββββ | 50/100 [00:26<00:26, 1.88it/s][A
|
| 1742 |
+
|
| 1743 |
51%|βββββββββββββββββββββββββββββββ | 51/100 [00:26<00:25, 1.89it/s][A
|
| 1744 |
+
|
| 1745 |
52%|βββββοΏ½οΏ½ββββββββββββββββββββββββββ | 52/100 [00:27<00:25, 1.90it/s][A
|
| 1746 |
+
|
| 1747 |
53%|βββββββββββββββββββββββββββββββββ | 53/100 [00:27<00:25, 1.86it/s][A
|
| 1748 |
+
|
| 1749 |
54%|βββββββββββββββββββββββββββββββββ | 54/100 [00:28<00:24, 1.88it/s][A
|
| 1750 |
+
|
| 1751 |
55%|ββββββββββββββββββββββββββββββββββ | 55/100 [00:28<00:23, 1.89it/s][A
|
| 1752 |
+
|
| 1753 |
56%|βββββββββββββββββββββββββββββββββββ | 56/100 [00:29<00:23, 1.90it/s][A
|
| 1754 |
+
|
| 1755 |
57%|βββββββββββββββββββββββββββββββββββ | 57/100 [00:29<00:23, 1.86it/s][A
|
| 1756 |
+
|
| 1757 |
58%|ββββββββββββββββββββββββββββββββββββ | 58/100 [00:30<00:22, 1.88it/s][A
|
| 1758 |
+
|
| 1759 |
59%|ββββββββββββββββββββββββββββββββββββ | 59/100 [00:31<00:21, 1.89it/s][A
|
| 1760 |
+
|
| 1761 |
60%|βββββββββββββββββββββββββββββββββββββ | 60/100 [00:31<00:21, 1.90it/s][A
|
| 1762 |
+
|
| 1763 |
61%|ββββββββββββββββββββββββββββββββββββββ | 61/100 [00:32<00:20, 1.86it/s][A
|
| 1764 |
+
|
| 1765 |
62%|ββββββββββββββββββββββββββββββββββββββ | 62/100 [00:32<00:20, 1.88it/s][A
|
| 1766 |
+
|
| 1767 |
63%|βββββββββββββββββββββββββββββββββββββββ | 63/100 [00:33<00:19, 1.89it/s][A
|
| 1768 |
+
|
| 1769 |
64%|βββββββββββββββββββββββββββββββββββββββ | 64/100 [00:33<00:18, 1.90it/s][A
|
| 1770 |
+
|
| 1771 |
65%|ββββββββββββββββββββββββββββββββββββββββ | 65/100 [00:34<00:18, 1.86it/s][A
|
| 1772 |
+
|
| 1773 |
66%|βββββββββββββββββββββββββββββββββββββββββ | 66/100 [00:34<00:18, 1.88it/s][A
|
| 1774 |
+
|
| 1775 |
67%|βββββββββββββββββββββββββββββββββββββββββ | 67/100 [00:35<00:17, 1.89it/s][A
|
| 1776 |
+
|
| 1777 |
68%|ββββββββββββββββββββββββββββββββββββββββββ | 68/100 [00:35<00:16, 1.90it/s][A
|
| 1778 |
+
|
| 1779 |
69%|ββββββββββββββββββββββββββββββββββββββββββ | 69/100 [00:36<00:16, 1.86it/s][A
|
| 1780 |
+
|
| 1781 |
70%|βββββββββββββββββββββββββββββββββββββββββββ | 70/100 [00:36<00:15, 1.88it/s][A
|
| 1782 |
+
|
| 1783 |
71%|ββββββββββββββββββββββββββββββββββββββββββββ | 71/100 [00:37<00:15, 1.89it/s][A
|
| 1784 |
+
|
| 1785 |
72%|ββββββββββββββββββββββββββββββββββββββββββββ | 72/100 [00:37<00:14, 1.90it/s][A
|
| 1786 |
+
|
| 1787 |
73%|βββββββββββββββββββββββββββββββββββββββββββββ | 73/100 [00:38<00:14, 1.86it/s][A
|
| 1788 |
+
|
| 1789 |
74%|ββββββββββββββββββββββββββββββββββββββββββββββ | 74/100 [00:39<00:13, 1.88it/s][A
|
| 1790 |
+
|
| 1791 |
75%|ββββββββββββββββββββββββββββββββββββββββββββββ | 75/100 [00:39<00:13, 1.89it/s][A
|
| 1792 |
+
|
| 1793 |
76%|βββββββββββββββββββββββββββββββββββββββββββββββ | 76/100 [00:40<00:12, 1.90it/s][A
|
| 1794 |
+
|
| 1795 |
77%|βββββββββββββββββββββββββββββββββββββββββββββββ | 77/100 [00:40<00:12, 1.86it/s][A
|
| 1796 |
+
|
| 1797 |
78%|ββββββββββββββββββββββββββββββββββββββββββββββββ | 78/100 [00:41<00:11, 1.88it/s][A
|
| 1798 |
+
|
| 1799 |
79%|ββββββββββββββββββββββββββββββββββββββββββββββοΏ½οΏ½ββ | 79/100 [00:41<00:11, 1.89it/s][A
|
| 1800 |
+
|
| 1801 |
80%|βββββββββββββββββββββββββββββββββββββββββββββββββ | 80/100 [00:42<00:10, 1.90it/s][A
|
| 1802 |
+
|
| 1803 |
81%|ββββββββββββββββββββββββββββββββββββββββββββββββββ | 81/100 [00:42<00:10, 1.86it/s][A
|
| 1804 |
+
|
| 1805 |
82%|ββββββββββββββββββββββββββββββββββββββββββββββββββ | 82/100 [00:43<00:09, 1.88it/s][A
|
| 1806 |
+
|
| 1807 |
83%|βββββββββββββββββββββββββββββββββββββββββββββββββββ | 83/100 [00:43<00:08, 1.89it/s][A
|
| 1808 |
+
|
| 1809 |
84%|ββββββββββββββββββββββββββββββββββββββββββββββββββββ | 84/100 [00:44<00:08, 1.90it/s][A
|
| 1810 |
+
|
| 1811 |
85%|ββββββββββββββββββββββββββββββββββββββββββββββββββββ | 85/100 [00:44<00:08, 1.86it/s][A
|
| 1812 |
+
|
| 1813 |
86%|βββββββββββββββββββββββββββββββββββββββββββββββββββββ | 86/100 [00:45<00:07, 1.88it/s][A
|
| 1814 |
+
|
| 1815 |
87%|βββββββββββββββββββββββββββββββββββββββββββββββββββββ | 87/100 [00:45<00:06, 1.89it/s][A
|
| 1816 |
+
|
| 1817 |
88%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 88/100 [00:46<00:06, 1.90it/s][A
|
| 1818 |
+
|
| 1819 |
89%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 89/100 [00:47<00:05, 1.86it/s][A
|
| 1820 |
+
|
| 1821 |
90%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 90/100 [00:47<00:05, 1.88it/s][A
|
| 1822 |
+
|
| 1823 |
91%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 91/100 [00:48<00:04, 1.89it/s][A
|
| 1824 |
+
|
| 1825 |
92%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 92/100 [00:48<00:04, 1.90it/s][A
|
| 1826 |
+
|
| 1827 |
93%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 93/100 [00:49<00:03, 1.86it/s][A
|
| 1828 |
+
|
| 1829 |
94%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 94/100 [00:49<00:03, 1.88it/s][A
|
| 1830 |
+
|
| 1831 |
95%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 95/100 [00:50<00:02, 1.89it/s][A
|
| 1832 |
+
|
| 1833 |
96%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 96/100 [00:50<00:02, 1.90it/s][A
|
| 1834 |
+
|
| 1835 |
97%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 97/100 [00:51<00:01, 1.86it/s][A
|
| 1836 |
+
|
| 1837 |
98%|ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ | 98/100 [00:51<00:01, 1.88it/s][A
|
| 1838 |
+
|
| 1839 |
99%|βββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ| 99/100 [00:52<00:00, 1.89it/s][A
|
| 1840 |
+
|
| 1841 |
|
| 1842 |
+
|
| 1843 |
|
| 1844 |
+
|
| 1845 |
77%|ββββββοΏ½οΏ½οΏ½ββββββββββββββββββββββββββββββββββββββ | 500/650 [1:18:37<20:39, 8.27s/it]
|
| 1846 |
+
|
| 1847 |
+
|
| 1848 |
[A[2026-01-24 14:44:10,048] [INFO] [axolotl.core.trainers.base._save:721] [PID:9359] Saving model checkpoint to ./phi4_african_history_lora_out/checkpoint-500
|