Training in progress, step 7200
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4902257696
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:510150b1585101cc9ba05b76f03765846c8ce19e4723eeab3847451d588ef8d4
|
| 3 |
size 4902257696
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915960368
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:12a9bc8b42d508a88338ecf639885f7fcba435bdf770d93c8b1fe92c754f28a7
|
| 3 |
size 4915960368
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4983068496
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5adce3c0dd0b8406bd43519082075ed8a8802e1e36cfe9b7fa92da17545fef46
|
| 3 |
size 4983068496
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1580230264
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0b880aeaa797806bf0620e9b7a7bfee62512405126eee3c1ec4b7d947561c20d
|
| 3 |
size 1580230264
|
trainer_log.jsonl
CHANGED
|
@@ -2102,3 +2102,43 @@
|
|
| 2102 |
{"current_steps": 6990, "total_steps": 8169, "loss": 0.1447, "lr": 2.48903926869273e-06, "epoch": 5.989717223650386, "percentage": 85.57, "elapsed_time": "1 day, 19:40:32", "remaining_time": "7:22:00"}
|
| 2103 |
{"current_steps": 6995, "total_steps": 8169, "loss": 0.1581, "lr": 2.468434515428868e-06, "epoch": 5.994001713796059, "percentage": 85.63, "elapsed_time": "1 day, 19:43:01", "remaining_time": "7:20:14"}
|
| 2104 |
{"current_steps": 7000, "total_steps": 8169, "loss": 0.154, "lr": 2.4479097915151438e-06, "epoch": 5.998286203941731, "percentage": 85.69, "elapsed_time": "1 day, 19:45:52", "remaining_time": "7:18:31"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2102 |
{"current_steps": 6990, "total_steps": 8169, "loss": 0.1447, "lr": 2.48903926869273e-06, "epoch": 5.989717223650386, "percentage": 85.57, "elapsed_time": "1 day, 19:40:32", "remaining_time": "7:22:00"}
|
| 2103 |
{"current_steps": 6995, "total_steps": 8169, "loss": 0.1581, "lr": 2.468434515428868e-06, "epoch": 5.994001713796059, "percentage": 85.63, "elapsed_time": "1 day, 19:43:01", "remaining_time": "7:20:14"}
|
| 2104 |
{"current_steps": 7000, "total_steps": 8169, "loss": 0.154, "lr": 2.4479097915151438e-06, "epoch": 5.998286203941731, "percentage": 85.69, "elapsed_time": "1 day, 19:45:52", "remaining_time": "7:18:31"}
|
| 2105 |
+
{"current_steps": 7005, "total_steps": 8169, "loss": 0.1349, "lr": 2.4274651906443026e-06, "epoch": 6.002570694087404, "percentage": 85.75, "elapsed_time": "1 day, 19:50:04", "remaining_time": "7:17:01"}
|
| 2106 |
+
{"current_steps": 7010, "total_steps": 8169, "loss": 0.1307, "lr": 2.407100806143321e-06, "epoch": 6.006855184233077, "percentage": 85.81, "elapsed_time": "1 day, 19:52:55", "remaining_time": "7:15:18"}
|
| 2107 |
+
{"current_steps": 7015, "total_steps": 8169, "loss": 0.1347, "lr": 2.386816730973005e-06, "epoch": 6.011139674378749, "percentage": 85.87, "elapsed_time": "1 day, 19:55:48", "remaining_time": "7:13:36"}
|
| 2108 |
+
{"current_steps": 7020, "total_steps": 8169, "loss": 0.1422, "lr": 2.3666130577275604e-06, "epoch": 6.015424164524422, "percentage": 85.93, "elapsed_time": "1 day, 19:58:43", "remaining_time": "7:11:53"}
|
| 2109 |
+
{"current_steps": 7025, "total_steps": 8169, "loss": 0.1258, "lr": 2.3464898786341615e-06, "epoch": 6.019708654670095, "percentage": 86.0, "elapsed_time": "1 day, 20:01:35", "remaining_time": "7:10:10"}
|
| 2110 |
+
{"current_steps": 7030, "total_steps": 8169, "loss": 0.123, "lr": 2.3264472855525532e-06, "epoch": 6.023993144815767, "percentage": 86.06, "elapsed_time": "1 day, 20:04:35", "remaining_time": "7:08:28"}
|
| 2111 |
+
{"current_steps": 7035, "total_steps": 8169, "loss": 0.1271, "lr": 2.3064853699745936e-06, "epoch": 6.02827763496144, "percentage": 86.12, "elapsed_time": "1 day, 20:07:30", "remaining_time": "7:06:45"}
|
| 2112 |
+
{"current_steps": 7040, "total_steps": 8169, "loss": 0.1378, "lr": 2.2866042230238804e-06, "epoch": 6.032562125107113, "percentage": 86.18, "elapsed_time": "1 day, 20:10:13", "remaining_time": "7:05:00"}
|
| 2113 |
+
{"current_steps": 7045, "total_steps": 8169, "loss": 0.1227, "lr": 2.266803935455295e-06, "epoch": 6.036846615252785, "percentage": 86.24, "elapsed_time": "1 day, 20:13:06", "remaining_time": "7:03:17"}
|
| 2114 |
+
{"current_steps": 7050, "total_steps": 8169, "loss": 0.1244, "lr": 2.2470845976546163e-06, "epoch": 6.041131105398458, "percentage": 86.3, "elapsed_time": "1 day, 20:15:51", "remaining_time": "7:01:32"}
|
| 2115 |
+
{"current_steps": 7055, "total_steps": 8169, "loss": 0.136, "lr": 2.227446299638092e-06, "epoch": 6.045415595544131, "percentage": 86.36, "elapsed_time": "1 day, 20:18:34", "remaining_time": "6:59:47"}
|
| 2116 |
+
{"current_steps": 7060, "total_steps": 8169, "loss": 0.1278, "lr": 2.2078891310520346e-06, "epoch": 6.049700085689803, "percentage": 86.42, "elapsed_time": "1 day, 20:21:13", "remaining_time": "6:58:01"}
|
| 2117 |
+
{"current_steps": 7065, "total_steps": 8169, "loss": 0.1377, "lr": 2.188413181172415e-06, "epoch": 6.053984575835476, "percentage": 86.49, "elapsed_time": "1 day, 20:23:52", "remaining_time": "6:56:15"}
|
| 2118 |
+
{"current_steps": 7070, "total_steps": 8169, "loss": 0.1393, "lr": 2.169018538904455e-06, "epoch": 6.058269065981149, "percentage": 86.55, "elapsed_time": "1 day, 20:26:29", "remaining_time": "6:54:29"}
|
| 2119 |
+
{"current_steps": 7075, "total_steps": 8169, "loss": 0.1329, "lr": 2.149705292782205e-06, "epoch": 6.062553556126821, "percentage": 86.61, "elapsed_time": "1 day, 20:29:11", "remaining_time": "6:52:44"}
|
| 2120 |
+
{"current_steps": 7080, "total_steps": 8169, "loss": 0.1369, "lr": 2.13047353096816e-06, "epoch": 6.066838046272494, "percentage": 86.67, "elapsed_time": "1 day, 20:31:57", "remaining_time": "6:50:59"}
|
| 2121 |
+
{"current_steps": 7085, "total_steps": 8169, "loss": 0.128, "lr": 2.111323341252851e-06, "epoch": 6.071122536418166, "percentage": 86.73, "elapsed_time": "1 day, 20:34:56", "remaining_time": "6:49:15"}
|
| 2122 |
+
{"current_steps": 7090, "total_steps": 8169, "loss": 0.1277, "lr": 2.092254811054437e-06, "epoch": 6.075407026563839, "percentage": 86.79, "elapsed_time": "1 day, 20:37:48", "remaining_time": "6:47:31"}
|
| 2123 |
+
{"current_steps": 7095, "total_steps": 8169, "loss": 0.1186, "lr": 2.073268027418314e-06, "epoch": 6.079691516709511, "percentage": 86.85, "elapsed_time": "1 day, 20:40:36", "remaining_time": "6:45:46"}
|
| 2124 |
+
{"current_steps": 7100, "total_steps": 8169, "loss": 0.1285, "lr": 2.0543630770167166e-06, "epoch": 6.083976006855184, "percentage": 86.91, "elapsed_time": "1 day, 20:43:23", "remaining_time": "6:44:01"}
|
| 2125 |
+
{"current_steps": 7105, "total_steps": 8169, "loss": 0.1439, "lr": 2.0355400461483278e-06, "epoch": 6.0882604970008565, "percentage": 86.98, "elapsed_time": "1 day, 20:46:13", "remaining_time": "6:42:16"}
|
| 2126 |
+
{"current_steps": 7110, "total_steps": 8169, "loss": 0.1355, "lr": 2.0167990207378696e-06, "epoch": 6.092544987146529, "percentage": 87.04, "elapsed_time": "1 day, 20:48:56", "remaining_time": "6:40:30"}
|
| 2127 |
+
{"current_steps": 7115, "total_steps": 8169, "loss": 0.134, "lr": 1.998140086335718e-06, "epoch": 6.096829477292202, "percentage": 87.1, "elapsed_time": "1 day, 20:51:53", "remaining_time": "6:38:46"}
|
| 2128 |
+
{"current_steps": 7120, "total_steps": 8169, "loss": 0.1155, "lr": 1.97956332811752e-06, "epoch": 6.1011139674378745, "percentage": 87.16, "elapsed_time": "1 day, 20:54:45", "remaining_time": "6:37:01"}
|
| 2129 |
+
{"current_steps": 7125, "total_steps": 8169, "loss": 0.1395, "lr": 1.96106883088379e-06, "epoch": 6.105398457583547, "percentage": 87.22, "elapsed_time": "1 day, 20:57:36", "remaining_time": "6:35:16"}
|
| 2130 |
+
{"current_steps": 7130, "total_steps": 8169, "loss": 0.1219, "lr": 1.942656679059547e-06, "epoch": 6.10968294772922, "percentage": 87.28, "elapsed_time": "1 day, 21:00:33", "remaining_time": "6:33:31"}
|
| 2131 |
+
{"current_steps": 7135, "total_steps": 8169, "loss": 0.1274, "lr": 1.924326956693905e-06, "epoch": 6.1139674378748925, "percentage": 87.34, "elapsed_time": "1 day, 21:03:30", "remaining_time": "6:31:47"}
|
| 2132 |
+
{"current_steps": 7140, "total_steps": 8169, "loss": 0.1355, "lr": 1.906079747459695e-06, "epoch": 6.118251928020565, "percentage": 87.4, "elapsed_time": "1 day, 21:06:23", "remaining_time": "6:30:02"}
|
| 2133 |
+
{"current_steps": 7145, "total_steps": 8169, "loss": 0.138, "lr": 1.8879151346530889e-06, "epoch": 6.122536418166238, "percentage": 87.46, "elapsed_time": "1 day, 21:09:04", "remaining_time": "6:28:15"}
|
| 2134 |
+
{"current_steps": 7150, "total_steps": 8169, "loss": 0.1327, "lr": 1.8698332011932164e-06, "epoch": 6.1268209083119105, "percentage": 87.53, "elapsed_time": "1 day, 21:11:54", "remaining_time": "6:26:29"}
|
| 2135 |
+
{"current_steps": 7155, "total_steps": 8169, "loss": 0.1362, "lr": 1.8518340296217907e-06, "epoch": 6.131105398457583, "percentage": 87.59, "elapsed_time": "1 day, 21:14:58", "remaining_time": "6:24:45"}
|
| 2136 |
+
{"current_steps": 7160, "total_steps": 8169, "loss": 0.1332, "lr": 1.8339177021027144e-06, "epoch": 6.135389888603256, "percentage": 87.65, "elapsed_time": "1 day, 21:17:40", "remaining_time": "6:22:58"}
|
| 2137 |
+
{"current_steps": 7165, "total_steps": 8169, "loss": 0.1328, "lr": 1.8160843004217344e-06, "epoch": 6.1396743787489285, "percentage": 87.71, "elapsed_time": "1 day, 21:20:29", "remaining_time": "6:21:12"}
|
| 2138 |
+
{"current_steps": 7170, "total_steps": 8169, "loss": 0.1519, "lr": 1.7983339059860472e-06, "epoch": 6.143958868894601, "percentage": 87.77, "elapsed_time": "1 day, 21:23:20", "remaining_time": "6:19:26"}
|
| 2139 |
+
{"current_steps": 7175, "total_steps": 8169, "loss": 0.1361, "lr": 1.780666599823926e-06, "epoch": 6.148243359040274, "percentage": 87.83, "elapsed_time": "1 day, 21:26:14", "remaining_time": "6:17:41"}
|
| 2140 |
+
{"current_steps": 7180, "total_steps": 8169, "loss": 0.1262, "lr": 1.7630824625843579e-06, "epoch": 6.1525278491859465, "percentage": 87.89, "elapsed_time": "1 day, 21:29:16", "remaining_time": "6:15:56"}
|
| 2141 |
+
{"current_steps": 7185, "total_steps": 8169, "loss": 0.146, "lr": 1.745581574536679e-06, "epoch": 6.156812339331619, "percentage": 87.95, "elapsed_time": "1 day, 21:32:06", "remaining_time": "6:14:10"}
|
| 2142 |
+
{"current_steps": 7190, "total_steps": 8169, "loss": 0.1267, "lr": 1.728164015570195e-06, "epoch": 6.161096829477292, "percentage": 88.02, "elapsed_time": "1 day, 21:35:03", "remaining_time": "6:12:24"}
|
| 2143 |
+
{"current_steps": 7195, "total_steps": 8169, "loss": 0.134, "lr": 1.7108298651938393e-06, "epoch": 6.1653813196229645, "percentage": 88.08, "elapsed_time": "1 day, 21:37:53", "remaining_time": "6:10:37"}
|
| 2144 |
+
{"current_steps": 7200, "total_steps": 8169, "loss": 0.1252, "lr": 1.69357920253578e-06, "epoch": 6.169665809768637, "percentage": 88.14, "elapsed_time": "1 day, 21:40:35", "remaining_time": "6:08:50"}
|