Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:051d5668a04cc82311647f0e61fd60cf01d4d5e94004f6397c71d3a8a3da76c4
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:35ba29e4dfcdb83ec3838a8933550af71351c21be97e2dc957f374195a53b449
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:79d8bef13c386a820ecc00732522b5e4e85e8e93cfba5a986264652edd9bb573
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d538d8fa19241687206f65046e9ce847e7cd3028840eba86b1001974f2040ba1
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -80,3 +80,42 @@
|
|
| 80 |
{"current_steps": 80, "total_steps": 190, "loss": 0.3866, "lr": 2.8701313729641467e-05, "epoch": 2.0844155844155843, "percentage": 42.11, "elapsed_time": "0:31:58", "remaining_time": "0:43:58"}
|
| 81 |
{"current_steps": 81, "total_steps": 190, "loss": 0.3825, "lr": 2.8369023454079223e-05, "epoch": 2.1103896103896105, "percentage": 42.63, "elapsed_time": "0:32:18", "remaining_time": "0:43:29"}
|
| 82 |
{"current_steps": 82, "total_steps": 190, "loss": 0.3714, "lr": 2.8033908493059394e-05, "epoch": 2.1363636363636362, "percentage": 43.16, "elapsed_time": "0:32:40", "remaining_time": "0:43:02"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 80 |
{"current_steps": 80, "total_steps": 190, "loss": 0.3866, "lr": 2.8701313729641467e-05, "epoch": 2.0844155844155843, "percentage": 42.11, "elapsed_time": "0:31:58", "remaining_time": "0:43:58"}
|
| 81 |
{"current_steps": 81, "total_steps": 190, "loss": 0.3825, "lr": 2.8369023454079223e-05, "epoch": 2.1103896103896105, "percentage": 42.63, "elapsed_time": "0:32:18", "remaining_time": "0:43:29"}
|
| 82 |
{"current_steps": 82, "total_steps": 190, "loss": 0.3714, "lr": 2.8033908493059394e-05, "epoch": 2.1363636363636362, "percentage": 43.16, "elapsed_time": "0:32:40", "remaining_time": "0:43:02"}
|
| 83 |
+
{"current_steps": 83, "total_steps": 190, "loss": 0.3888, "lr": 2.7696081953488917e-05, "epoch": 2.1623376623376624, "percentage": 43.68, "elapsed_time": "0:33:03", "remaining_time": "0:42:37"}
|
| 84 |
+
{"current_steps": 84, "total_steps": 190, "loss": 0.3642, "lr": 2.735565785747787e-05, "epoch": 2.188311688311688, "percentage": 44.21, "elapsed_time": "0:33:25", "remaining_time": "0:42:11"}
|
| 85 |
+
{"current_steps": 85, "total_steps": 190, "loss": 0.3783, "lr": 2.7012751103855092e-05, "epoch": 2.2142857142857144, "percentage": 44.74, "elapsed_time": "0:33:47", "remaining_time": "0:41:44"}
|
| 86 |
+
{"current_steps": 86, "total_steps": 190, "loss": 0.3754, "lr": 2.6667477429387915e-05, "epoch": 2.24025974025974, "percentage": 45.26, "elapsed_time": "0:34:08", "remaining_time": "0:41:17"}
|
| 87 |
+
{"current_steps": 87, "total_steps": 190, "loss": 0.3473, "lr": 2.6319953369719057e-05, "epoch": 2.2662337662337664, "percentage": 45.79, "elapsed_time": "0:34:34", "remaining_time": "0:40:56"}
|
| 88 |
+
{"current_steps": 88, "total_steps": 190, "loss": 0.3471, "lr": 2.5970296220033894e-05, "epoch": 2.292207792207792, "percentage": 46.32, "elapsed_time": "0:35:01", "remaining_time": "0:40:35"}
|
| 89 |
+
{"current_steps": 89, "total_steps": 190, "loss": 0.3837, "lr": 2.5618623995471394e-05, "epoch": 2.3181818181818183, "percentage": 46.84, "elapsed_time": "0:35:22", "remaining_time": "0:40:08"}
|
| 90 |
+
{"current_steps": 90, "total_steps": 190, "loss": 0.3528, "lr": 2.5265055391291986e-05, "epoch": 2.344155844155844, "percentage": 47.37, "elapsed_time": "0:35:47", "remaining_time": "0:39:45"}
|
| 91 |
+
{"current_steps": 91, "total_steps": 190, "loss": 0.3649, "lr": 2.4909709742815986e-05, "epoch": 2.3701298701298703, "percentage": 47.89, "elapsed_time": "0:36:13", "remaining_time": "0:39:24"}
|
| 92 |
+
{"current_steps": 92, "total_steps": 190, "loss": 0.3669, "lr": 2.4552706985145873e-05, "epoch": 2.396103896103896, "percentage": 48.42, "elapsed_time": "0:36:31", "remaining_time": "0:38:54"}
|
| 93 |
+
{"current_steps": 93, "total_steps": 190, "loss": 0.3532, "lr": 2.4194167612686208e-05, "epoch": 2.4220779220779223, "percentage": 48.95, "elapsed_time": "0:36:50", "remaining_time": "0:38:25"}
|
| 94 |
+
{"current_steps": 94, "total_steps": 190, "loss": 0.3657, "lr": 2.3834212638474773e-05, "epoch": 2.448051948051948, "percentage": 49.47, "elapsed_time": "0:37:10", "remaining_time": "0:37:58"}
|
| 95 |
+
{"current_steps": 95, "total_steps": 190, "loss": 0.3621, "lr": 2.3472963553338614e-05, "epoch": 2.474025974025974, "percentage": 50.0, "elapsed_time": "0:37:29", "remaining_time": "0:37:29"}
|
| 96 |
+
{"current_steps": 96, "total_steps": 190, "loss": 0.3467, "lr": 2.3110542284888866e-05, "epoch": 2.5, "percentage": 50.53, "elapsed_time": "0:37:46", "remaining_time": "0:36:59"}
|
| 97 |
+
{"current_steps": 97, "total_steps": 190, "loss": 0.3624, "lr": 2.2747071156368166e-05, "epoch": 2.525974025974026, "percentage": 51.05, "elapsed_time": "0:38:12", "remaining_time": "0:36:38"}
|
| 98 |
+
{"current_steps": 98, "total_steps": 190, "loss": 0.3564, "lr": 2.2382672845364474e-05, "epoch": 2.551948051948052, "percentage": 51.58, "elapsed_time": "0:38:34", "remaining_time": "0:36:13"}
|
| 99 |
+
{"current_steps": 99, "total_steps": 190, "loss": 0.3658, "lr": 2.201747034240537e-05, "epoch": 2.5779220779220777, "percentage": 52.11, "elapsed_time": "0:38:59", "remaining_time": "0:35:50"}
|
| 100 |
+
{"current_steps": 100, "total_steps": 190, "loss": 0.3473, "lr": 2.165158690944665e-05, "epoch": 2.603896103896104, "percentage": 52.63, "elapsed_time": "0:39:20", "remaining_time": "0:35:24"}
|
| 101 |
+
{"current_steps": 101, "total_steps": 190, "loss": 0.3416, "lr": 2.1285146038269406e-05, "epoch": 2.62987012987013, "percentage": 53.16, "elapsed_time": "0:39:46", "remaining_time": "0:35:03"}
|
| 102 |
+
{"current_steps": 102, "total_steps": 190, "loss": 0.3448, "lr": 2.091827140879944e-05, "epoch": 2.655844155844156, "percentage": 53.68, "elapsed_time": "0:40:17", "remaining_time": "0:34:45"}
|
| 103 |
+
{"current_steps": 103, "total_steps": 190, "loss": 0.3433, "lr": 2.0551086847363245e-05, "epoch": 2.6818181818181817, "percentage": 54.21, "elapsed_time": "0:40:40", "remaining_time": "0:34:21"}
|
| 104 |
+
{"current_steps": 104, "total_steps": 190, "loss": 0.3467, "lr": 2.0183716284894533e-05, "epoch": 2.707792207792208, "percentage": 54.74, "elapsed_time": "0:41:00", "remaining_time": "0:33:54"}
|
| 105 |
+
{"current_steps": 105, "total_steps": 190, "loss": 0.3482, "lr": 1.9816283715105474e-05, "epoch": 2.7337662337662336, "percentage": 55.26, "elapsed_time": "0:41:19", "remaining_time": "0:33:27"}
|
| 106 |
+
{"current_steps": 106, "total_steps": 190, "loss": 0.3545, "lr": 1.9448913152636765e-05, "epoch": 2.75974025974026, "percentage": 55.79, "elapsed_time": "0:41:39", "remaining_time": "0:33:00"}
|
| 107 |
+
{"current_steps": 107, "total_steps": 190, "loss": 0.3666, "lr": 1.9081728591200565e-05, "epoch": 2.7857142857142856, "percentage": 56.32, "elapsed_time": "0:42:00", "remaining_time": "0:32:35"}
|
| 108 |
+
{"current_steps": 108, "total_steps": 190, "loss": 0.344, "lr": 1.87148539617306e-05, "epoch": 2.811688311688312, "percentage": 56.84, "elapsed_time": "0:42:21", "remaining_time": "0:32:09"}
|
| 109 |
+
{"current_steps": 109, "total_steps": 190, "loss": 0.3387, "lr": 1.8348413090553356e-05, "epoch": 2.8376623376623376, "percentage": 57.37, "elapsed_time": "0:42:39", "remaining_time": "0:31:41"}
|
| 110 |
+
{"current_steps": 110, "total_steps": 190, "loss": 0.3604, "lr": 1.7982529657594637e-05, "epoch": 2.8636363636363638, "percentage": 57.89, "elapsed_time": "0:43:01", "remaining_time": "0:31:17"}
|
| 111 |
+
{"current_steps": 111, "total_steps": 190, "loss": 0.3363, "lr": 1.761732715463553e-05, "epoch": 2.8896103896103895, "percentage": 58.42, "elapsed_time": "0:43:19", "remaining_time": "0:30:50"}
|
| 112 |
+
{"current_steps": 112, "total_steps": 190, "loss": 0.3546, "lr": 1.7252928843631838e-05, "epoch": 2.9155844155844157, "percentage": 58.95, "elapsed_time": "0:43:39", "remaining_time": "0:30:24"}
|
| 113 |
+
{"current_steps": 113, "total_steps": 190, "loss": 0.3486, "lr": 1.6889457715111144e-05, "epoch": 2.9415584415584415, "percentage": 59.47, "elapsed_time": "0:44:08", "remaining_time": "0:30:04"}
|
| 114 |
+
{"current_steps": 114, "total_steps": 190, "loss": 0.3352, "lr": 1.6527036446661396e-05, "epoch": 2.9675324675324677, "percentage": 60.0, "elapsed_time": "0:44:28", "remaining_time": "0:29:39"}
|
| 115 |
+
{"current_steps": 115, "total_steps": 190, "loss": 0.3593, "lr": 1.6165787361525237e-05, "epoch": 2.9935064935064934, "percentage": 60.53, "elapsed_time": "0:44:51", "remaining_time": "0:29:15"}
|
| 116 |
+
{"current_steps": 116, "total_steps": 190, "loss": 0.2407, "lr": 1.5805832387313795e-05, "epoch": 3.022727272727273, "percentage": 61.05, "elapsed_time": "0:46:11", "remaining_time": "0:29:28"}
|
| 117 |
+
{"current_steps": 117, "total_steps": 190, "loss": 0.1911, "lr": 1.544729301485414e-05, "epoch": 3.0487012987012987, "percentage": 61.58, "elapsed_time": "0:46:30", "remaining_time": "0:29:01"}
|
| 118 |
+
{"current_steps": 118, "total_steps": 190, "loss": 0.1896, "lr": 1.5090290257184019e-05, "epoch": 3.074675324675325, "percentage": 62.11, "elapsed_time": "0:46:49", "remaining_time": "0:28:34"}
|
| 119 |
+
{"current_steps": 119, "total_steps": 190, "loss": 0.2093, "lr": 1.4734944608708022e-05, "epoch": 3.1006493506493507, "percentage": 62.63, "elapsed_time": "0:47:12", "remaining_time": "0:28:10"}
|
| 120 |
+
{"current_steps": 120, "total_steps": 190, "loss": 0.2057, "lr": 1.4381376004528616e-05, "epoch": 3.1266233766233764, "percentage": 63.16, "elapsed_time": "0:47:36", "remaining_time": "0:27:46"}
|
| 121 |
+
{"current_steps": 121, "total_steps": 190, "loss": 0.1884, "lr": 1.4029703779966116e-05, "epoch": 3.1525974025974026, "percentage": 63.68, "elapsed_time": "0:47:53", "remaining_time": "0:27:18"}
|