Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:289fbdd3278cc741d2ecefbbc382b926e2f10f15989e6861dd369ff7b9f9a3e6
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:25ffa792e41ff8816be4609eb15a9817a6ace5265c8838ecab52ed501165ccaa
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f82fd0022ea67e460d1ea2c170c883eefacaec923c375d5c2b5b17e6bee15aaf
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2fd5742327cbd950239c1de000c210e156ec6d2d6abba2c0f8c5e11d050e26de
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -128,3 +128,60 @@
|
|
| 128 |
{"current_steps": 128, "total_steps": 186, "loss": 0.6588, "lr": 2.6924157895271563e-06, "epoch": 2.048, "percentage": 68.82, "elapsed_time": "1:50:10", "remaining_time": "0:49:55"}
|
| 129 |
{"current_steps": 129, "total_steps": 186, "loss": 0.7366, "lr": 2.6093857305493666e-06, "epoch": 2.064, "percentage": 69.35, "elapsed_time": "1:51:12", "remaining_time": "0:49:08"}
|
| 130 |
{"current_steps": 130, "total_steps": 186, "loss": 0.634, "lr": 2.5272016582081236e-06, "epoch": 2.08, "percentage": 69.89, "elapsed_time": "1:51:53", "remaining_time": "0:48:11"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 128 |
{"current_steps": 128, "total_steps": 186, "loss": 0.6588, "lr": 2.6924157895271563e-06, "epoch": 2.048, "percentage": 68.82, "elapsed_time": "1:50:10", "remaining_time": "0:49:55"}
|
| 129 |
{"current_steps": 129, "total_steps": 186, "loss": 0.7366, "lr": 2.6093857305493666e-06, "epoch": 2.064, "percentage": 69.35, "elapsed_time": "1:51:12", "remaining_time": "0:49:08"}
|
| 130 |
{"current_steps": 130, "total_steps": 186, "loss": 0.634, "lr": 2.5272016582081236e-06, "epoch": 2.08, "percentage": 69.89, "elapsed_time": "1:51:53", "remaining_time": "0:48:11"}
|
| 131 |
+
{"current_steps": 131, "total_steps": 186, "loss": 0.7273, "lr": 2.445892655667462e-06, "epoch": 2.096, "percentage": 70.43, "elapsed_time": "1:52:44", "remaining_time": "0:47:20"}
|
| 132 |
+
{"current_steps": 132, "total_steps": 186, "loss": 0.7158, "lr": 2.365487496423152e-06, "epoch": 2.112, "percentage": 70.97, "elapsed_time": "1:53:33", "remaining_time": "0:46:27"}
|
| 133 |
+
{"current_steps": 133, "total_steps": 186, "loss": 0.674, "lr": 2.2860146341203936e-06, "epoch": 2.128, "percentage": 71.51, "elapsed_time": "1:54:18", "remaining_time": "0:45:33"}
|
| 134 |
+
{"current_steps": 134, "total_steps": 186, "loss": 0.7368, "lr": 2.207502192484685e-06, "epoch": 2.144, "percentage": 72.04, "elapsed_time": "1:55:13", "remaining_time": "0:44:42"}
|
| 135 |
+
{"current_steps": 135, "total_steps": 186, "loss": 0.7117, "lr": 2.1299779553694323e-06, "epoch": 2.16, "percentage": 72.58, "elapsed_time": "1:56:02", "remaining_time": "0:43:50"}
|
| 136 |
+
{"current_steps": 136, "total_steps": 186, "loss": 0.6312, "lr": 2.053469356923865e-06, "epoch": 2.176, "percentage": 73.12, "elapsed_time": "1:56:42", "remaining_time": "0:42:54"}
|
| 137 |
+
{"current_steps": 137, "total_steps": 186, "loss": 0.7096, "lr": 1.9780034718846653e-06, "epoch": 2.192, "percentage": 73.66, "elapsed_time": "1:57:21", "remaining_time": "0:41:58"}
|
| 138 |
+
{"current_steps": 138, "total_steps": 186, "loss": 0.6783, "lr": 1.9036070059948253e-06, "epoch": 2.208, "percentage": 74.19, "elapsed_time": "1:58:03", "remaining_time": "0:41:03"}
|
| 139 |
+
{"current_steps": 139, "total_steps": 186, "loss": 0.7526, "lr": 1.8303062865530407e-06, "epoch": 2.224, "percentage": 74.73, "elapsed_time": "1:58:52", "remaining_time": "0:40:11"}
|
| 140 |
+
{"current_steps": 140, "total_steps": 186, "loss": 0.7312, "lr": 1.7581272530970666e-06, "epoch": 2.24, "percentage": 75.27, "elapsed_time": "1:59:48", "remaining_time": "0:39:21"}
|
| 141 |
+
{"current_steps": 141, "total_steps": 186, "loss": 0.6695, "lr": 1.6870954482242707e-06, "epoch": 2.2560000000000002, "percentage": 75.81, "elapsed_time": "2:00:35", "remaining_time": "0:38:29"}
|
| 142 |
+
{"current_steps": 142, "total_steps": 186, "loss": 0.6941, "lr": 1.6172360085526567e-06, "epoch": 2.2720000000000002, "percentage": 76.34, "elapsed_time": "2:01:23", "remaining_time": "0:37:36"}
|
| 143 |
+
{"current_steps": 143, "total_steps": 186, "loss": 0.6693, "lr": 1.54857365582557e-06, "epoch": 2.288, "percentage": 76.88, "elapsed_time": "2:02:14", "remaining_time": "0:36:45"}
|
| 144 |
+
{"current_steps": 144, "total_steps": 186, "loss": 0.6711, "lr": 1.4811326881631937e-06, "epoch": 2.304, "percentage": 77.42, "elapsed_time": "2:03:03", "remaining_time": "0:35:53"}
|
| 145 |
+
{"current_steps": 145, "total_steps": 186, "loss": 0.7054, "lr": 1.4149369714639856e-06, "epoch": 2.32, "percentage": 77.96, "elapsed_time": "2:04:04", "remaining_time": "0:35:04"}
|
| 146 |
+
{"current_steps": 146, "total_steps": 186, "loss": 0.625, "lr": 1.3500099309590397e-06, "epoch": 2.336, "percentage": 78.49, "elapsed_time": "2:04:50", "remaining_time": "0:34:12"}
|
| 147 |
+
{"current_steps": 147, "total_steps": 186, "loss": 0.6545, "lr": 1.2863745429224145e-06, "epoch": 2.352, "percentage": 79.03, "elapsed_time": "2:05:42", "remaining_time": "0:33:21"}
|
| 148 |
+
{"current_steps": 148, "total_steps": 186, "loss": 0.7246, "lr": 1.22405332654032e-06, "epoch": 2.368, "percentage": 79.57, "elapsed_time": "2:06:32", "remaining_time": "0:32:29"}
|
| 149 |
+
{"current_steps": 149, "total_steps": 186, "loss": 0.7389, "lr": 1.1630683359420653e-06, "epoch": 2.384, "percentage": 80.11, "elapsed_time": "2:07:30", "remaining_time": "0:31:39"}
|
| 150 |
+
{"current_steps": 150, "total_steps": 186, "loss": 0.6475, "lr": 1.103441152395588e-06, "epoch": 2.4, "percentage": 80.65, "elapsed_time": "2:08:13", "remaining_time": "0:30:46"}
|
| 151 |
+
{"current_steps": 151, "total_steps": 186, "loss": 0.7146, "lr": 1.045192876670298e-06, "epoch": 2.416, "percentage": 81.18, "elapsed_time": "2:09:13", "remaining_time": "0:29:57"}
|
| 152 |
+
{"current_steps": 152, "total_steps": 186, "loss": 0.724, "lr": 9.883441215699824e-07, "epoch": 2.432, "percentage": 81.72, "elapsed_time": "2:10:08", "remaining_time": "0:29:06"}
|
| 153 |
+
{"current_steps": 153, "total_steps": 186, "loss": 0.6687, "lr": 9.329150046383773e-07, "epoch": 2.448, "percentage": 82.26, "elapsed_time": "2:10:52", "remaining_time": "0:28:13"}
|
| 154 |
+
{"current_steps": 154, "total_steps": 186, "loss": 0.7853, "lr": 8.789251410400024e-07, "epoch": 2.464, "percentage": 82.8, "elapsed_time": "2:12:00", "remaining_time": "0:27:25"}
|
| 155 |
+
{"current_steps": 155, "total_steps": 186, "loss": 0.7102, "lr": 8.263936366187825e-07, "epoch": 2.48, "percentage": 83.33, "elapsed_time": "2:12:49", "remaining_time": "0:26:33"}
|
| 156 |
+
{"current_steps": 156, "total_steps": 186, "loss": 0.7436, "lr": 7.753390811368972e-07, "epoch": 2.496, "percentage": 83.87, "elapsed_time": "2:13:42", "remaining_time": "0:25:42"}
|
| 157 |
+
{"current_steps": 157, "total_steps": 186, "loss": 0.684, "lr": 7.257795416962754e-07, "epoch": 2.512, "percentage": 84.41, "elapsed_time": "2:14:31", "remaining_time": "0:24:50"}
|
| 158 |
+
{"current_steps": 158, "total_steps": 186, "loss": 0.6822, "lr": 6.777325563450282e-07, "epoch": 2.528, "percentage": 84.95, "elapsed_time": "2:15:13", "remaining_time": "0:23:57"}
|
| 159 |
+
{"current_steps": 159, "total_steps": 186, "loss": 0.706, "lr": 6.312151278711237e-07, "epoch": 2.544, "percentage": 85.48, "elapsed_time": "2:16:02", "remaining_time": "0:23:06"}
|
| 160 |
+
{"current_steps": 160, "total_steps": 186, "loss": 0.7186, "lr": 5.862437177854629e-07, "epoch": 2.56, "percentage": 86.02, "elapsed_time": "2:16:46", "remaining_time": "0:22:13"}
|
| 161 |
+
{"current_steps": 161, "total_steps": 186, "loss": 0.7398, "lr": 5.428342404965076e-07, "epoch": 2.576, "percentage": 86.56, "elapsed_time": "2:17:40", "remaining_time": "0:21:22"}
|
| 162 |
+
{"current_steps": 162, "total_steps": 186, "loss": 0.6833, "lr": 5.010020576785174e-07, "epoch": 2.592, "percentage": 87.1, "elapsed_time": "2:18:30", "remaining_time": "0:20:31"}
|
| 163 |
+
{"current_steps": 163, "total_steps": 186, "loss": 0.6949, "lr": 4.607619728353818e-07, "epoch": 2.608, "percentage": 87.63, "elapsed_time": "2:19:16", "remaining_time": "0:19:39"}
|
| 164 |
+
{"current_steps": 164, "total_steps": 186, "loss": 0.6992, "lr": 4.221282260619891e-07, "epoch": 2.624, "percentage": 88.17, "elapsed_time": "2:20:04", "remaining_time": "0:18:47"}
|
| 165 |
+
{"current_steps": 165, "total_steps": 186, "loss": 0.7146, "lr": 3.851144890049535e-07, "epoch": 2.64, "percentage": 88.71, "elapsed_time": "2:20:56", "remaining_time": "0:17:56"}
|
| 166 |
+
{"current_steps": 166, "total_steps": 186, "loss": 0.6423, "lr": 3.497338600245254e-07, "epoch": 2.656, "percentage": 89.25, "elapsed_time": "2:21:39", "remaining_time": "0:17:04"}
|
| 167 |
+
{"current_steps": 167, "total_steps": 186, "loss": 0.6919, "lr": 3.159988595593616e-07, "epoch": 2.672, "percentage": 89.78, "elapsed_time": "2:22:32", "remaining_time": "0:16:13"}
|
| 168 |
+
{"current_steps": 168, "total_steps": 186, "loss": 0.7524, "lr": 2.839214256958106e-07, "epoch": 2.6879999999999997, "percentage": 90.32, "elapsed_time": "2:23:31", "remaining_time": "0:15:22"}
|
| 169 |
+
{"current_steps": 169, "total_steps": 186, "loss": 0.7457, "lr": 2.5351290994328703e-07, "epoch": 2.7039999999999997, "percentage": 90.86, "elapsed_time": "2:24:22", "remaining_time": "0:14:31"}
|
| 170 |
+
{"current_steps": 170, "total_steps": 186, "loss": 0.747, "lr": 2.2478407321721295e-07, "epoch": 2.7199999999999998, "percentage": 91.4, "elapsed_time": "2:25:16", "remaining_time": "0:13:40"}
|
| 171 |
+
{"current_steps": 171, "total_steps": 186, "loss": 0.7235, "lr": 1.9774508203096843e-07, "epoch": 2.7359999999999998, "percentage": 91.94, "elapsed_time": "2:26:06", "remaining_time": "0:12:48"}
|
| 172 |
+
{"current_steps": 172, "total_steps": 186, "loss": 0.6887, "lr": 1.7240550489817652e-07, "epoch": 2.752, "percentage": 92.47, "elapsed_time": "2:27:02", "remaining_time": "0:11:58"}
|
| 173 |
+
{"current_steps": 173, "total_steps": 186, "loss": 0.7928, "lr": 1.4877430894662037e-07, "epoch": 2.768, "percentage": 93.01, "elapsed_time": "2:27:44", "remaining_time": "0:11:06"}
|
| 174 |
+
{"current_steps": 174, "total_steps": 186, "loss": 0.7622, "lr": 1.268598567449647e-07, "epoch": 2.784, "percentage": 93.55, "elapsed_time": "2:28:33", "remaining_time": "0:10:14"}
|
| 175 |
+
{"current_steps": 175, "total_steps": 186, "loss": 0.716, "lr": 1.0666990334342708e-07, "epoch": 2.8, "percentage": 94.09, "elapsed_time": "2:29:22", "remaining_time": "0:09:23"}
|
| 176 |
+
{"current_steps": 176, "total_steps": 186, "loss": 0.6963, "lr": 8.821159352943142e-08, "epoch": 2.816, "percentage": 94.62, "elapsed_time": "2:30:21", "remaining_time": "0:08:32"}
|
| 177 |
+
{"current_steps": 177, "total_steps": 186, "loss": 0.6921, "lr": 7.149145929922607e-08, "epoch": 2.832, "percentage": 95.16, "elapsed_time": "2:31:06", "remaining_time": "0:07:41"}
|
| 178 |
+
{"current_steps": 178, "total_steps": 186, "loss": 0.7491, "lr": 5.651541754634726e-08, "epoch": 2.848, "percentage": 95.7, "elapsed_time": "2:31:50", "remaining_time": "0:06:49"}
|
| 179 |
+
{"current_steps": 179, "total_steps": 186, "loss": 0.6694, "lr": 4.328876796776071e-08, "epoch": 2.864, "percentage": 96.24, "elapsed_time": "2:32:42", "remaining_time": "0:05:58"}
|
| 180 |
+
{"current_steps": 180, "total_steps": 186, "loss": 0.7126, "lr": 3.181619118841517e-08, "epoch": 2.88, "percentage": 96.77, "elapsed_time": "2:33:23", "remaining_time": "0:05:06"}
|
| 181 |
+
{"current_steps": 181, "total_steps": 186, "loss": 0.6724, "lr": 2.210174710486679e-08, "epoch": 2.896, "percentage": 97.31, "elapsed_time": "2:34:17", "remaining_time": "0:04:15"}
|
| 182 |
+
{"current_steps": 182, "total_steps": 186, "loss": 0.7101, "lr": 1.4148873448573408e-08, "epoch": 2.912, "percentage": 97.85, "elapsed_time": "2:35:07", "remaining_time": "0:03:24"}
|
| 183 |
+
{"current_steps": 183, "total_steps": 186, "loss": 0.7491, "lr": 7.96038456935322e-09, "epoch": 2.928, "percentage": 98.39, "elapsed_time": "2:35:53", "remaining_time": "0:02:33"}
|
| 184 |
+
{"current_steps": 184, "total_steps": 186, "loss": 0.7011, "lr": 3.538470439448105e-09, "epoch": 2.944, "percentage": 98.92, "elapsed_time": "2:36:48", "remaining_time": "0:01:42"}
|
| 185 |
+
{"current_steps": 185, "total_steps": 186, "loss": 0.7158, "lr": 8.846958785418969e-10, "epoch": 2.96, "percentage": 99.46, "elapsed_time": "2:37:37", "remaining_time": "0:00:51"}
|
| 186 |
+
{"current_steps": 186, "total_steps": 186, "loss": 0.7134, "lr": 0.0, "epoch": 2.976, "percentage": 100.0, "elapsed_time": "2:38:36", "remaining_time": "0:00:00"}
|
| 187 |
+
{"current_steps": 186, "total_steps": 186, "epoch": 2.976, "percentage": 100.0, "elapsed_time": "2:40:45", "remaining_time": "0:00:00"}
|