Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a34a9e5b25cd1055ae7aa0bfcf0a258f56c65dd7df68759753bf70c20f84ff4
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f32c62b39bf8f4073dcadb2b49178f70ad45348736cee00ac3795f7b813b259a
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4be9c18016feb23c1d34f5732268794381043bc2366fa72b1022896a648c8a5d
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3bef089507508ddaa4833aed8a2ad3bb0991e46b9f6b42c37e0d4ee6ce781585
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -55,3 +55,31 @@
|
|
| 55 |
{"current_steps": 55, "total_steps": 84, "loss": 0.7228, "lr": 2.6057118107127402e-05, "epoch": 1.9262472885032538, "percentage": 65.48, "elapsed_time": "2:23:34", "remaining_time": "1:15:42"}
|
| 56 |
{"current_steps": 56, "total_steps": 84, "loss": 0.7208, "lr": 2.4499376541915883e-05, "epoch": 1.9609544468546638, "percentage": 66.67, "elapsed_time": "2:26:07", "remaining_time": "1:13:03"}
|
| 57 |
{"current_steps": 57, "total_steps": 84, "loss": 1.1849, "lr": 2.2968828337397095e-05, "epoch": 2.013015184381779, "percentage": 67.86, "elapsed_time": "2:30:19", "remaining_time": "1:11:12"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 55 |
{"current_steps": 55, "total_steps": 84, "loss": 0.7228, "lr": 2.6057118107127402e-05, "epoch": 1.9262472885032538, "percentage": 65.48, "elapsed_time": "2:23:34", "remaining_time": "1:15:42"}
|
| 56 |
{"current_steps": 56, "total_steps": 84, "loss": 0.7208, "lr": 2.4499376541915883e-05, "epoch": 1.9609544468546638, "percentage": 66.67, "elapsed_time": "2:26:07", "remaining_time": "1:13:03"}
|
| 57 |
{"current_steps": 57, "total_steps": 84, "loss": 1.1849, "lr": 2.2968828337397095e-05, "epoch": 2.013015184381779, "percentage": 67.86, "elapsed_time": "2:30:19", "remaining_time": "1:11:12"}
|
| 58 |
+
{"current_steps": 58, "total_steps": 84, "loss": 0.6845, "lr": 2.1468158595205543e-05, "epoch": 2.0477223427331888, "percentage": 69.05, "elapsed_time": "2:32:52", "remaining_time": "1:08:31"}
|
| 59 |
+
{"current_steps": 59, "total_steps": 84, "loss": 0.681, "lr": 2.0000000000000012e-05, "epoch": 2.0824295010845986, "percentage": 70.24, "elapsed_time": "2:35:26", "remaining_time": "1:05:51"}
|
| 60 |
+
{"current_steps": 60, "total_steps": 84, "loss": 0.6803, "lr": 1.8566928200840128e-05, "epoch": 2.117136659436009, "percentage": 71.43, "elapsed_time": "2:37:59", "remaining_time": "1:03:11"}
|
| 61 |
+
{"current_steps": 61, "total_steps": 84, "loss": 0.6756, "lr": 1.7171457292622736e-05, "epoch": 2.1518438177874186, "percentage": 72.62, "elapsed_time": "2:40:33", "remaining_time": "1:00:32"}
|
| 62 |
+
{"current_steps": 62, "total_steps": 84, "loss": 0.6713, "lr": 1.5816035405505007e-05, "epoch": 2.1865509761388284, "percentage": 73.81, "elapsed_time": "2:43:06", "remaining_time": "0:57:52"}
|
| 63 |
+
{"current_steps": 63, "total_steps": 84, "loss": 0.6778, "lr": 1.4503040410052412e-05, "epoch": 2.2212581344902387, "percentage": 75.0, "elapsed_time": "2:45:39", "remaining_time": "0:55:13"}
|
| 64 |
+
{"current_steps": 64, "total_steps": 84, "loss": 0.6733, "lr": 1.3234775745645684e-05, "epoch": 2.2559652928416485, "percentage": 76.19, "elapsed_time": "2:48:12", "remaining_time": "0:52:33"}
|
| 65 |
+
{"current_steps": 65, "total_steps": 84, "loss": 0.673, "lr": 1.201346637946538e-05, "epoch": 2.2906724511930587, "percentage": 77.38, "elapsed_time": "2:50:45", "remaining_time": "0:49:54"}
|
| 66 |
+
{"current_steps": 66, "total_steps": 84, "loss": 0.6758, "lr": 1.0841254903143547e-05, "epoch": 2.3253796095444685, "percentage": 78.57, "elapsed_time": "2:53:18", "remaining_time": "0:47:15"}
|
| 67 |
+
{"current_steps": 67, "total_steps": 84, "loss": 0.6708, "lr": 9.720197773929749e-06, "epoch": 2.3600867678958783, "percentage": 79.76, "elapsed_time": "2:55:51", "remaining_time": "0:44:37"}
|
| 68 |
+
{"current_steps": 68, "total_steps": 84, "loss": 0.6694, "lr": 8.652261706966412e-06, "epoch": 2.3947939262472886, "percentage": 80.95, "elapsed_time": "2:58:26", "remaining_time": "0:41:59"}
|
| 69 |
+
{"current_steps": 69, "total_steps": 84, "loss": 0.6749, "lr": 7.639320225002106e-06, "epoch": 2.4295010845986984, "percentage": 82.14, "elapsed_time": "3:00:59", "remaining_time": "0:39:20"}
|
| 70 |
+
{"current_steps": 70, "total_steps": 84, "loss": 0.6752, "lr": 6.6831503715960235e-06, "epoch": 2.4642082429501087, "percentage": 83.33, "elapsed_time": "3:03:33", "remaining_time": "0:36:42"}
|
| 71 |
+
{"current_steps": 71, "total_steps": 84, "loss": 0.6781, "lr": 5.785429593579736e-06, "epoch": 2.4989154013015185, "percentage": 84.52, "elapsed_time": "3:06:06", "remaining_time": "0:34:04"}
|
| 72 |
+
{"current_steps": 72, "total_steps": 84, "loss": 0.6716, "lr": 4.947732798245466e-06, "epoch": 2.5336225596529283, "percentage": 85.71, "elapsed_time": "3:08:40", "remaining_time": "0:31:26"}
|
| 73 |
+
{"current_steps": 73, "total_steps": 84, "loss": 0.6779, "lr": 4.171529590423484e-06, "epoch": 2.5683297180043385, "percentage": 86.9, "elapsed_time": "3:11:13", "remaining_time": "0:28:48"}
|
| 74 |
+
{"current_steps": 74, "total_steps": 84, "loss": 0.6805, "lr": 3.458181694295961e-06, "epoch": 2.6030368763557483, "percentage": 88.1, "elapsed_time": "3:13:47", "remaining_time": "0:26:11"}
|
| 75 |
+
{"current_steps": 75, "total_steps": 84, "loss": 0.6719, "lr": 2.8089405644699463e-06, "epoch": 2.6377440347071586, "percentage": 89.29, "elapsed_time": "3:16:21", "remaining_time": "0:23:33"}
|
| 76 |
+
{"current_steps": 76, "total_steps": 84, "loss": 0.675, "lr": 2.2249451905007603e-06, "epoch": 2.6724511930585684, "percentage": 90.48, "elapsed_time": "3:18:54", "remaining_time": "0:20:56"}
|
| 77 |
+
{"current_steps": 77, "total_steps": 84, "loss": 0.6767, "lr": 1.7072200987173105e-06, "epoch": 2.707158351409978, "percentage": 91.67, "elapsed_time": "3:21:26", "remaining_time": "0:18:18"}
|
| 78 |
+
{"current_steps": 78, "total_steps": 84, "loss": 0.6633, "lr": 1.256673554854757e-06, "epoch": 2.7418655097613884, "percentage": 92.86, "elapsed_time": "3:23:59", "remaining_time": "0:15:41"}
|
| 79 |
+
{"current_steps": 79, "total_steps": 84, "loss": 0.6672, "lr": 8.740959706477725e-07, "epoch": 2.7765726681127982, "percentage": 94.05, "elapsed_time": "3:26:32", "remaining_time": "0:13:04"}
|
| 80 |
+
{"current_steps": 80, "total_steps": 84, "loss": 0.6708, "lr": 5.601585171798052e-07, "epoch": 2.811279826464208, "percentage": 95.24, "elapsed_time": "3:29:05", "remaining_time": "0:10:27"}
|
| 81 |
+
{"current_steps": 81, "total_steps": 84, "loss": 0.6748, "lr": 3.154119474208894e-07, "epoch": 2.8459869848156183, "percentage": 96.43, "elapsed_time": "3:31:38", "remaining_time": "0:07:50"}
|
| 82 |
+
{"current_steps": 82, "total_steps": 84, "loss": 0.6686, "lr": 1.402856300198252e-07, "epoch": 2.880694143167028, "percentage": 97.62, "elapsed_time": "3:34:10", "remaining_time": "0:05:13"}
|
| 83 |
+
{"current_steps": 83, "total_steps": 84, "loss": 0.662, "lr": 3.5086796045664674e-08, "epoch": 2.915401301518438, "percentage": 98.81, "elapsed_time": "3:36:43", "remaining_time": "0:02:36"}
|
| 84 |
+
{"current_steps": 84, "total_steps": 84, "loss": 0.673, "lr": 0.0, "epoch": 2.950108459869848, "percentage": 100.0, "elapsed_time": "3:39:16", "remaining_time": "0:00:00"}
|
| 85 |
+
{"current_steps": 84, "total_steps": 84, "epoch": 2.950108459869848, "percentage": 100.0, "elapsed_time": "3:40:52", "remaining_time": "0:00:00"}
|