Training in progress, step 7600
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4902257696
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b5f334f5afe449a3011d215337373b7326b2460b08dcc4f033940513e27c6f9a
|
| 3 |
size 4902257696
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915960368
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:62ec755d06127e628b922395015710ab55c9ca048e27538356b0e16a409e1db4
|
| 3 |
size 4915960368
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4983068496
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c6b54065f4695921ea58283c3f620f2e7ac4cab716f4a5a8a9b0603eff88bfdf
|
| 3 |
size 4983068496
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1580230264
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:736de5030acda2b7dbb38923f822e5d5b41450ab6cd1cbaba89bd495fd8ea864
|
| 3 |
size 1580230264
|
trainer_log.jsonl
CHANGED
|
@@ -1504,3 +1504,31 @@
|
|
| 1504 |
{"current_steps": 7450, "total_steps": 9625, "loss": 0.1639, "lr": 5.911823029029531e-06, "epoch": 5.4183339396144055, "percentage": 77.4, "elapsed_time": "1:43:00", "remaining_time": "0:30:04"}
|
| 1505 |
{"current_steps": 7455, "total_steps": 9625, "loss": 0.157, "lr": 5.8861029031564185e-06, "epoch": 5.421971626045835, "percentage": 77.45, "elapsed_time": "1:45:55", "remaining_time": "0:30:49"}
|
| 1506 |
{"current_steps": 7460, "total_steps": 9625, "loss": 0.1584, "lr": 5.860429191414232e-06, "epoch": 5.425609312477264, "percentage": 77.51, "elapsed_time": "1:48:33", "remaining_time": "0:31:30"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1504 |
{"current_steps": 7450, "total_steps": 9625, "loss": 0.1639, "lr": 5.911823029029531e-06, "epoch": 5.4183339396144055, "percentage": 77.4, "elapsed_time": "1:43:00", "remaining_time": "0:30:04"}
|
| 1505 |
{"current_steps": 7455, "total_steps": 9625, "loss": 0.157, "lr": 5.8861029031564185e-06, "epoch": 5.421971626045835, "percentage": 77.45, "elapsed_time": "1:45:55", "remaining_time": "0:30:49"}
|
| 1506 |
{"current_steps": 7460, "total_steps": 9625, "loss": 0.1584, "lr": 5.860429191414232e-06, "epoch": 5.425609312477264, "percentage": 77.51, "elapsed_time": "1:48:33", "remaining_time": "0:31:30"}
|
| 1507 |
+
{"current_steps": 7465, "total_steps": 9625, "loss": 0.1663, "lr": 5.834801978232019e-06, "epoch": 5.429246998908694, "percentage": 77.56, "elapsed_time": "1:51:15", "remaining_time": "0:32:11"}
|
| 1508 |
+
{"current_steps": 7470, "total_steps": 9625, "loss": 0.1589, "lr": 5.809221347885929e-06, "epoch": 5.432884685340124, "percentage": 77.61, "elapsed_time": "1:54:04", "remaining_time": "0:32:54"}
|
| 1509 |
+
{"current_steps": 7475, "total_steps": 9625, "loss": 0.1661, "lr": 5.7836873844989195e-06, "epoch": 5.436522371771553, "percentage": 77.66, "elapsed_time": "1:57:03", "remaining_time": "0:33:40"}
|
| 1510 |
+
{"current_steps": 7480, "total_steps": 9625, "loss": 0.1754, "lr": 5.758200172040484e-06, "epoch": 5.4401600582029825, "percentage": 77.71, "elapsed_time": "1:59:51", "remaining_time": "0:34:22"}
|
| 1511 |
+
{"current_steps": 7485, "total_steps": 9625, "loss": 0.1473, "lr": 5.732759794326355e-06, "epoch": 5.443797744634413, "percentage": 77.77, "elapsed_time": "2:02:13", "remaining_time": "0:34:56"}
|
| 1512 |
+
{"current_steps": 7490, "total_steps": 9625, "loss": 0.1499, "lr": 5.707366335018267e-06, "epoch": 5.447435431065842, "percentage": 77.82, "elapsed_time": "2:05:07", "remaining_time": "0:35:39"}
|
| 1513 |
+
{"current_steps": 7495, "total_steps": 9625, "loss": 0.1587, "lr": 5.682019877623666e-06, "epoch": 5.4510731174972715, "percentage": 77.87, "elapsed_time": "2:08:01", "remaining_time": "0:36:22"}
|
| 1514 |
+
{"current_steps": 7500, "total_steps": 9625, "loss": 0.1574, "lr": 5.656720505495399e-06, "epoch": 5.454710803928702, "percentage": 77.92, "elapsed_time": "2:10:48", "remaining_time": "0:37:03"}
|
| 1515 |
+
{"current_steps": 7505, "total_steps": 9625, "loss": 0.1639, "lr": 5.631468301831509e-06, "epoch": 5.458348490360131, "percentage": 77.97, "elapsed_time": "2:13:42", "remaining_time": "0:37:46"}
|
| 1516 |
+
{"current_steps": 7510, "total_steps": 9625, "loss": 0.1565, "lr": 5.606263349674894e-06, "epoch": 5.4619861767915605, "percentage": 78.03, "elapsed_time": "2:16:46", "remaining_time": "0:38:31"}
|
| 1517 |
+
{"current_steps": 7515, "total_steps": 9625, "loss": 0.1501, "lr": 5.581105731913079e-06, "epoch": 5.46562386322299, "percentage": 78.08, "elapsed_time": "2:19:46", "remaining_time": "0:39:14"}
|
| 1518 |
+
{"current_steps": 7520, "total_steps": 9625, "loss": 0.14, "lr": 5.555995531277931e-06, "epoch": 5.46926154965442, "percentage": 78.13, "elapsed_time": "2:22:48", "remaining_time": "0:39:58"}
|
| 1519 |
+
{"current_steps": 7525, "total_steps": 9625, "loss": 0.1386, "lr": 5.530932830345368e-06, "epoch": 5.4728992360858495, "percentage": 78.18, "elapsed_time": "2:25:39", "remaining_time": "0:40:38"}
|
| 1520 |
+
{"current_steps": 7530, "total_steps": 9625, "loss": 0.1635, "lr": 5.50591771153512e-06, "epoch": 5.476536922517279, "percentage": 78.23, "elapsed_time": "2:28:28", "remaining_time": "0:41:18"}
|
| 1521 |
+
{"current_steps": 7535, "total_steps": 9625, "loss": 0.1483, "lr": 5.480950257110424e-06, "epoch": 5.480174608948708, "percentage": 78.29, "elapsed_time": "2:30:47", "remaining_time": "0:41:49"}
|
| 1522 |
+
{"current_steps": 7540, "total_steps": 9625, "loss": 0.1654, "lr": 5.4560305491777885e-06, "epoch": 5.4838122953801385, "percentage": 78.34, "elapsed_time": "2:33:34", "remaining_time": "0:42:28"}
|
| 1523 |
+
{"current_steps": 7545, "total_steps": 9625, "loss": 0.1709, "lr": 5.431158669686696e-06, "epoch": 5.487449981811568, "percentage": 78.39, "elapsed_time": "2:36:32", "remaining_time": "0:43:09"}
|
| 1524 |
+
{"current_steps": 7550, "total_steps": 9625, "loss": 0.1685, "lr": 5.4063347004293495e-06, "epoch": 5.491087668242997, "percentage": 78.44, "elapsed_time": "2:39:25", "remaining_time": "0:43:48"}
|
| 1525 |
+
{"current_steps": 7555, "total_steps": 9625, "loss": 0.1593, "lr": 5.381558723040388e-06, "epoch": 5.4947253546744275, "percentage": 78.49, "elapsed_time": "2:42:21", "remaining_time": "0:44:29"}
|
| 1526 |
+
{"current_steps": 7560, "total_steps": 9625, "loss": 0.1683, "lr": 5.356830818996621e-06, "epoch": 5.498363041105857, "percentage": 78.55, "elapsed_time": "2:45:20", "remaining_time": "0:45:09"}
|
| 1527 |
+
{"current_steps": 7565, "total_steps": 9625, "loss": 0.1602, "lr": 5.332151069616797e-06, "epoch": 5.502000727537286, "percentage": 78.6, "elapsed_time": "2:48:22", "remaining_time": "0:45:50"}
|
| 1528 |
+
{"current_steps": 7570, "total_steps": 9625, "loss": 0.164, "lr": 5.307519556061276e-06, "epoch": 5.505638413968716, "percentage": 78.65, "elapsed_time": "2:51:20", "remaining_time": "0:46:30"}
|
| 1529 |
+
{"current_steps": 7575, "total_steps": 9625, "loss": 0.1639, "lr": 5.2829363593318075e-06, "epoch": 5.509276100400146, "percentage": 78.7, "elapsed_time": "2:54:22", "remaining_time": "0:47:11"}
|
| 1530 |
+
{"current_steps": 7580, "total_steps": 9625, "loss": 0.1668, "lr": 5.258401560271238e-06, "epoch": 5.512913786831575, "percentage": 78.75, "elapsed_time": "2:57:18", "remaining_time": "0:47:50"}
|
| 1531 |
+
{"current_steps": 7585, "total_steps": 9625, "loss": 0.162, "lr": 5.2339152395632675e-06, "epoch": 5.5165514732630045, "percentage": 78.81, "elapsed_time": "3:00:00", "remaining_time": "0:48:24"}
|
| 1532 |
+
{"current_steps": 7590, "total_steps": 9625, "loss": 0.1609, "lr": 5.209477477732172e-06, "epoch": 5.520189159694434, "percentage": 78.86, "elapsed_time": "3:02:43", "remaining_time": "0:48:59"}
|
| 1533 |
+
{"current_steps": 7595, "total_steps": 9625, "loss": 0.1276, "lr": 5.185088355142529e-06, "epoch": 5.523826846125864, "percentage": 78.91, "elapsed_time": "3:04:41", "remaining_time": "0:49:21"}
|
| 1534 |
+
{"current_steps": 7600, "total_steps": 9625, "loss": 0.1633, "lr": 5.160747951998979e-06, "epoch": 5.5274645325572935, "percentage": 78.96, "elapsed_time": "3:07:38", "remaining_time": "0:49:59"}
|