Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5640feb9ce63d00217e08262b97b74fc945e26c70aacdef2131ffd47f158192b
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ec25a652cbda1b84f04f4ec3592e555dd2cd2431fe58a48244378cf01cd918d3
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c794e3203c7d04155566418905c7e4dc2527ae0843cb5d74ddecb7e96f17de78
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:73c8c1555f87907649eaa4618089a46566a0d7cf6d6d1d20c21d3cfb6f482f03
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -21,3 +21,24 @@
|
|
| 21 |
{"current_steps": 21, "total_steps": 60, "loss": 1.2317, "lr": 8.213938048432697e-06, "epoch": 1.016, "percentage": 35.0, "elapsed_time": "0:20:43", "remaining_time": "0:38:29"}
|
| 22 |
{"current_steps": 22, "total_steps": 60, "loss": 0.8934, "lr": 7.985792958513932e-06, "epoch": 1.064, "percentage": 36.67, "elapsed_time": "0:21:38", "remaining_time": "0:37:23"}
|
| 23 |
{"current_steps": 23, "total_steps": 60, "loss": 0.991, "lr": 7.747544890354031e-06, "epoch": 1.112, "percentage": 38.33, "elapsed_time": "0:22:33", "remaining_time": "0:36:16"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 21 |
{"current_steps": 21, "total_steps": 60, "loss": 1.2317, "lr": 8.213938048432697e-06, "epoch": 1.016, "percentage": 35.0, "elapsed_time": "0:20:43", "remaining_time": "0:38:29"}
|
| 22 |
{"current_steps": 22, "total_steps": 60, "loss": 0.8934, "lr": 7.985792958513932e-06, "epoch": 1.064, "percentage": 36.67, "elapsed_time": "0:21:38", "remaining_time": "0:37:23"}
|
| 23 |
{"current_steps": 23, "total_steps": 60, "loss": 0.991, "lr": 7.747544890354031e-06, "epoch": 1.112, "percentage": 38.33, "elapsed_time": "0:22:33", "remaining_time": "0:36:16"}
|
| 24 |
+
{"current_steps": 24, "total_steps": 60, "loss": 0.9389, "lr": 7.500000000000001e-06, "epoch": 1.16, "percentage": 40.0, "elapsed_time": "0:23:27", "remaining_time": "0:35:11"}
|
| 25 |
+
{"current_steps": 25, "total_steps": 60, "loss": 0.86, "lr": 7.243995901002312e-06, "epoch": 1.208, "percentage": 41.67, "elapsed_time": "0:24:25", "remaining_time": "0:34:11"}
|
| 26 |
+
{"current_steps": 26, "total_steps": 60, "loss": 0.9331, "lr": 6.980398830195785e-06, "epoch": 1.256, "percentage": 43.33, "elapsed_time": "0:25:21", "remaining_time": "0:33:09"}
|
| 27 |
+
{"current_steps": 27, "total_steps": 60, "loss": 0.9881, "lr": 6.710100716628345e-06, "epoch": 1.304, "percentage": 45.0, "elapsed_time": "0:26:13", "remaining_time": "0:32:02"}
|
| 28 |
+
{"current_steps": 28, "total_steps": 60, "loss": 0.9337, "lr": 6.434016163555452e-06, "epoch": 1.3519999999999999, "percentage": 46.67, "elapsed_time": "0:27:11", "remaining_time": "0:31:04"}
|
| 29 |
+
{"current_steps": 29, "total_steps": 60, "loss": 0.8651, "lr": 6.153079353712201e-06, "epoch": 1.4, "percentage": 48.33, "elapsed_time": "0:28:07", "remaining_time": "0:30:04"}
|
| 30 |
+
{"current_steps": 30, "total_steps": 60, "loss": 0.8596, "lr": 5.8682408883346535e-06, "epoch": 1.448, "percentage": 50.0, "elapsed_time": "0:28:57", "remaining_time": "0:28:57"}
|
| 31 |
+
{"current_steps": 31, "total_steps": 60, "loss": 0.8963, "lr": 5.5804645706261515e-06, "epoch": 1.496, "percentage": 51.67, "elapsed_time": "0:29:55", "remaining_time": "0:27:59"}
|
| 32 |
+
{"current_steps": 32, "total_steps": 60, "loss": 0.8475, "lr": 5.290724144552379e-06, "epoch": 1.544, "percentage": 53.33, "elapsed_time": "0:30:43", "remaining_time": "0:26:53"}
|
| 33 |
+
{"current_steps": 33, "total_steps": 60, "loss": 0.8904, "lr": 5e-06, "epoch": 1.592, "percentage": 55.0, "elapsed_time": "0:31:36", "remaining_time": "0:25:51"}
|
| 34 |
+
{"current_steps": 34, "total_steps": 60, "loss": 0.9363, "lr": 4.7092758554476215e-06, "epoch": 1.6400000000000001, "percentage": 56.67, "elapsed_time": "0:32:29", "remaining_time": "0:24:50"}
|
| 35 |
+
{"current_steps": 35, "total_steps": 60, "loss": 0.9859, "lr": 4.4195354293738484e-06, "epoch": 1.688, "percentage": 58.33, "elapsed_time": "0:33:32", "remaining_time": "0:23:57"}
|
| 36 |
+
{"current_steps": 36, "total_steps": 60, "loss": 0.7657, "lr": 4.131759111665349e-06, "epoch": 1.736, "percentage": 60.0, "elapsed_time": "0:34:22", "remaining_time": "0:22:55"}
|
| 37 |
+
{"current_steps": 37, "total_steps": 60, "loss": 0.9692, "lr": 3.8469206462878e-06, "epoch": 1.784, "percentage": 61.67, "elapsed_time": "0:35:21", "remaining_time": "0:21:58"}
|
| 38 |
+
{"current_steps": 38, "total_steps": 60, "loss": 0.894, "lr": 3.5659838364445505e-06, "epoch": 1.8319999999999999, "percentage": 63.33, "elapsed_time": "0:36:17", "remaining_time": "0:21:00"}
|
| 39 |
+
{"current_steps": 39, "total_steps": 60, "loss": 1.0476, "lr": 3.289899283371657e-06, "epoch": 1.88, "percentage": 65.0, "elapsed_time": "0:37:21", "remaining_time": "0:20:07"}
|
| 40 |
+
{"current_steps": 40, "total_steps": 60, "loss": 0.7547, "lr": 3.019601169804216e-06, "epoch": 1.928, "percentage": 66.67, "elapsed_time": "0:38:14", "remaining_time": "0:19:07"}
|
| 41 |
+
{"current_steps": 41, "total_steps": 60, "loss": 1.0386, "lr": 2.7560040989976894e-06, "epoch": 1.976, "percentage": 68.33, "elapsed_time": "0:39:11", "remaining_time": "0:18:09"}
|
| 42 |
+
{"current_steps": 42, "total_steps": 60, "loss": 1.0944, "lr": 2.5000000000000015e-06, "epoch": 2.032, "percentage": 70.0, "elapsed_time": "0:41:17", "remaining_time": "0:17:41"}
|
| 43 |
+
{"current_steps": 43, "total_steps": 60, "loss": 0.7287, "lr": 2.2524551096459703e-06, "epoch": 2.08, "percentage": 71.67, "elapsed_time": "0:42:03", "remaining_time": "0:16:37"}
|
| 44 |
+
{"current_steps": 44, "total_steps": 60, "loss": 0.9188, "lr": 2.0142070414860704e-06, "epoch": 2.128, "percentage": 73.33, "elapsed_time": "0:43:00", "remaining_time": "0:15:38"}
|