Training in progress, epoch 6
Browse files- model-00001-of-00014.safetensors +1 -1
- model-00002-of-00014.safetensors +1 -1
- model-00003-of-00014.safetensors +1 -1
- model-00004-of-00014.safetensors +1 -1
- model-00005-of-00014.safetensors +1 -1
- model-00006-of-00014.safetensors +1 -1
- model-00007-of-00014.safetensors +1 -1
- model-00008-of-00014.safetensors +1 -1
- model-00009-of-00014.safetensors +1 -1
- model-00010-of-00014.safetensors +1 -1
- model-00011-of-00014.safetensors +1 -1
- model-00012-of-00014.safetensors +1 -1
- model-00013-of-00014.safetensors +1 -1
- model-00014-of-00014.safetensors +1 -1
- trainer_log.jsonl +40 -0
model-00001-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4891730992
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6010c3932025f4568eb143d3f0e3fca015aa985410b86af4cd245eeedbb4042e
|
| 3 |
size 4891730992
|
model-00002-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059352
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5da985f22413e8503769440a44dd50b77537ae0511a1fb935106ecb9e9f7b214
|
| 3 |
size 4876059352
|
model-00003-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059384
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a0d50f7d2b47a57c2084ba091c5cea46c82bbc66606c426a4392d691af32904b
|
| 3 |
size 4876059384
|
model-00004-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d68d7c5fd03a4b1be1528bb0d9176d5fc696e963fee140d1b9b7354bd8c359ec
|
| 3 |
size 4876059416
|
model-00005-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a357f9418f51c2d78df09fa03c7512c97848f71354aaf95714414711e81462a
|
| 3 |
size 4876059416
|
model-00006-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4a67484f605266730a80cad1b910632fb3248515bbd4d2d3f4534f49dac83e21
|
| 3 |
size 4876059416
|
model-00007-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2e443c31e3f3af4ad91a0198419a2ede8cc7625922781a6dc760b51142e3d1da
|
| 3 |
size 4876059416
|
model-00008-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:59f2debb0b6a469ec4ce49c30f7440b655685738ebbcb32c8c04051328df8780
|
| 3 |
size 4876059416
|
model-00009-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d72fc8a34b9aa43926d7e82862bebb359ce4fb7daa4f97840a1e390d734ab899
|
| 3 |
size 4876059416
|
model-00010-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:32d33c7415b852b204e087a4dccccba93701361132331f5c4c56158b5c1c01ad
|
| 3 |
size 4876059416
|
model-00011-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:edd28be8fa042b7e2af2a38f13e2ec5afacdcf814173e23db2192dabbe0cbded
|
| 3 |
size 4876059416
|
model-00012-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1cddb7d84aa2109da78416c80e231e7ec280e2e057c19d3e1e4f977da36c207a
|
| 3 |
size 4876059416
|
model-00013-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4f7bdcf685cd7c3f9049e0814301c3ecef7ad9e4bc2b1b91ec4569154e3db88d
|
| 3 |
size 4876059416
|
model-00014-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2123397800
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9810e7dab886dceffbbf245c30095a6f0aab89cd39b8763b63699a5d303121a4
|
| 3 |
size 2123397800
|
trainer_log.jsonl
CHANGED
|
@@ -29,3 +29,43 @@
|
|
| 29 |
{"current_steps": 29, "total_steps": 70, "loss": 0.3724, "lr": 1.4562106573531632e-05, "epoch": 2.761904761904762, "percentage": 41.43, "elapsed_time": "0:27:39", "remaining_time": "0:39:06"}
|
| 30 |
{"current_steps": 30, "total_steps": 70, "loss": 0.356, "lr": 1.4112871031306118e-05, "epoch": 2.857142857142857, "percentage": 42.86, "elapsed_time": "0:28:22", "remaining_time": "0:37:49"}
|
| 31 |
{"current_steps": 31, "total_steps": 70, "loss": 0.3729, "lr": 1.3653410243663953e-05, "epoch": 2.9523809523809526, "percentage": 44.29, "elapsed_time": "0:29:05", "remaining_time": "0:36:36"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 29 |
{"current_steps": 29, "total_steps": 70, "loss": 0.3724, "lr": 1.4562106573531632e-05, "epoch": 2.761904761904762, "percentage": 41.43, "elapsed_time": "0:27:39", "remaining_time": "0:39:06"}
|
| 30 |
{"current_steps": 30, "total_steps": 70, "loss": 0.356, "lr": 1.4112871031306118e-05, "epoch": 2.857142857142857, "percentage": 42.86, "elapsed_time": "0:28:22", "remaining_time": "0:37:49"}
|
| 31 |
{"current_steps": 31, "total_steps": 70, "loss": 0.3729, "lr": 1.3653410243663953e-05, "epoch": 2.9523809523809526, "percentage": 44.29, "elapsed_time": "0:29:05", "remaining_time": "0:36:36"}
|
| 32 |
+
{"current_steps": 32, "total_steps": 70, "loss": 0.3332, "lr": 1.3184866502516846e-05, "epoch": 3.0476190476190474, "percentage": 45.71, "elapsed_time": "0:34:00", "remaining_time": "0:40:23"}
|
| 33 |
+
{"current_steps": 33, "total_steps": 70, "loss": 0.3045, "lr": 1.2708404681430054e-05, "epoch": 3.142857142857143, "percentage": 47.14, "elapsed_time": "0:34:41", "remaining_time": "0:38:53"}
|
| 34 |
+
{"current_steps": 34, "total_steps": 70, "loss": 0.2815, "lr": 1.2225209339563144e-05, "epoch": 3.238095238095238, "percentage": 48.57, "elapsed_time": "0:35:24", "remaining_time": "0:37:29"}
|
| 35 |
+
{"current_steps": 35, "total_steps": 70, "loss": 0.2993, "lr": 1.1736481776669307e-05, "epoch": 3.3333333333333335, "percentage": 50.0, "elapsed_time": "0:36:00", "remaining_time": "0:36:00"}
|
| 36 |
+
{"current_steps": 36, "total_steps": 70, "loss": 0.2955, "lr": 1.1243437046474854e-05, "epoch": 3.4285714285714284, "percentage": 51.43, "elapsed_time": "0:36:47", "remaining_time": "0:34:45"}
|
| 37 |
+
{"current_steps": 37, "total_steps": 70, "loss": 0.2987, "lr": 1.0747300935864245e-05, "epoch": 3.5238095238095237, "percentage": 52.86, "elapsed_time": "0:37:29", "remaining_time": "0:33:26"}
|
| 38 |
+
{"current_steps": 38, "total_steps": 70, "loss": 0.2944, "lr": 1.0249306917380731e-05, "epoch": 3.619047619047619, "percentage": 54.29, "elapsed_time": "0:38:09", "remaining_time": "0:32:07"}
|
| 39 |
+
{"current_steps": 39, "total_steps": 70, "loss": 0.2769, "lr": 9.750693082619274e-06, "epoch": 3.7142857142857144, "percentage": 55.71, "elapsed_time": "0:38:49", "remaining_time": "0:30:51"}
|
| 40 |
+
{"current_steps": 40, "total_steps": 70, "loss": 0.3137, "lr": 9.252699064135759e-06, "epoch": 3.8095238095238093, "percentage": 57.14, "elapsed_time": "0:39:25", "remaining_time": "0:29:33"}
|
| 41 |
+
{"current_steps": 41, "total_steps": 70, "loss": 0.2652, "lr": 8.756562953525151e-06, "epoch": 3.9047619047619047, "percentage": 58.57, "elapsed_time": "0:40:05", "remaining_time": "0:28:21"}
|
| 42 |
+
{"current_steps": 42, "total_steps": 70, "loss": 0.2901, "lr": 8.263518223330698e-06, "epoch": 4.0, "percentage": 60.0, "elapsed_time": "0:40:47", "remaining_time": "0:27:11"}
|
| 43 |
+
{"current_steps": 43, "total_steps": 70, "loss": 0.2513, "lr": 7.774790660436857e-06, "epoch": 4.095238095238095, "percentage": 61.43, "elapsed_time": "0:44:48", "remaining_time": "0:28:08"}
|
| 44 |
+
{"current_steps": 44, "total_steps": 70, "loss": 0.2517, "lr": 7.291595318569951e-06, "epoch": 4.190476190476191, "percentage": 62.86, "elapsed_time": "0:45:29", "remaining_time": "0:26:53"}
|
| 45 |
+
{"current_steps": 45, "total_steps": 70, "loss": 0.2496, "lr": 6.815133497483157e-06, "epoch": 4.285714285714286, "percentage": 64.29, "elapsed_time": "0:46:16", "remaining_time": "0:25:42"}
|
| 46 |
+
{"current_steps": 46, "total_steps": 70, "loss": 0.2777, "lr": 6.34658975633605e-06, "epoch": 4.380952380952381, "percentage": 65.71, "elapsed_time": "0:47:00", "remaining_time": "0:24:31"}
|
| 47 |
+
{"current_steps": 47, "total_steps": 70, "loss": 0.2519, "lr": 5.887128968693887e-06, "epoch": 4.476190476190476, "percentage": 67.14, "elapsed_time": "0:47:39", "remaining_time": "0:23:19"}
|
| 48 |
+
{"current_steps": 48, "total_steps": 70, "loss": 0.228, "lr": 5.43789342646837e-06, "epoch": 4.571428571428571, "percentage": 68.57, "elapsed_time": "0:48:24", "remaining_time": "0:22:11"}
|
| 49 |
+
{"current_steps": 49, "total_steps": 70, "loss": 0.2454, "lr": 5.000000000000003e-06, "epoch": 4.666666666666667, "percentage": 70.0, "elapsed_time": "0:48:59", "remaining_time": "0:20:59"}
|
| 50 |
+
{"current_steps": 50, "total_steps": 70, "loss": 0.2234, "lr": 4.5745373613424075e-06, "epoch": 4.761904761904762, "percentage": 71.43, "elapsed_time": "0:49:41", "remaining_time": "0:19:52"}
|
| 51 |
+
{"current_steps": 51, "total_steps": 70, "loss": 0.2155, "lr": 4.162563277652104e-06, "epoch": 4.857142857142857, "percentage": 72.86, "elapsed_time": "0:50:19", "remaining_time": "0:18:44"}
|
| 52 |
+
{"current_steps": 52, "total_steps": 70, "loss": 0.2527, "lr": 3.7651019814126656e-06, "epoch": 4.9523809523809526, "percentage": 74.29, "elapsed_time": "0:50:56", "remaining_time": "0:17:38"}
|
| 53 |
+
{"current_steps": 53, "total_steps": 70, "loss": 0.2293, "lr": 3.3831416240314085e-06, "epoch": 5.0476190476190474, "percentage": 75.71, "elapsed_time": "0:54:35", "remaining_time": "0:17:30"}
|
| 54 |
+
{"current_steps": 54, "total_steps": 70, "loss": 0.2281, "lr": 3.017631819139273e-06, "epoch": 5.142857142857143, "percentage": 77.14, "elapsed_time": "0:55:15", "remaining_time": "0:16:22"}
|
| 55 |
+
{"current_steps": 55, "total_steps": 70, "loss": 0.1992, "lr": 2.669481281701739e-06, "epoch": 5.238095238095238, "percentage": 78.57, "elapsed_time": "0:55:56", "remaining_time": "0:15:15"}
|
| 56 |
+
{"current_steps": 56, "total_steps": 70, "loss": 0.178, "lr": 2.339555568810221e-06, "epoch": 5.333333333333333, "percentage": 80.0, "elapsed_time": "0:56:30", "remaining_time": "0:14:07"}
|
| 57 |
+
{"current_steps": 57, "total_steps": 70, "loss": 0.2168, "lr": 2.0286749277707783e-06, "epoch": 5.428571428571429, "percentage": 81.43, "elapsed_time": "0:57:11", "remaining_time": "0:13:02"}
|
| 58 |
+
{"current_steps": 58, "total_steps": 70, "loss": 0.2271, "lr": 1.7376122568400533e-06, "epoch": 5.523809523809524, "percentage": 82.86, "elapsed_time": "0:57:52", "remaining_time": "0:11:58"}
|
| 59 |
+
{"current_steps": 59, "total_steps": 70, "loss": 0.2314, "lr": 1.467091183678444e-06, "epoch": 5.619047619047619, "percentage": 84.29, "elapsed_time": "0:58:31", "remaining_time": "0:10:54"}
|
| 60 |
+
{"current_steps": 60, "total_steps": 70, "loss": 0.1739, "lr": 1.2177842662977136e-06, "epoch": 5.714285714285714, "percentage": 85.71, "elapsed_time": "0:59:08", "remaining_time": "0:09:51"}
|
| 61 |
+
{"current_steps": 61, "total_steps": 70, "loss": 0.2262, "lr": 9.903113209758098e-07, "epoch": 5.809523809523809, "percentage": 87.14, "elapsed_time": "0:59:47", "remaining_time": "0:08:49"}
|
| 62 |
+
{"current_steps": 62, "total_steps": 70, "loss": 0.225, "lr": 7.852378812959227e-07, "epoch": 5.904761904761905, "percentage": 88.57, "elapsed_time": "1:00:31", "remaining_time": "0:07:48"}
|
| 63 |
+
{"current_steps": 63, "total_steps": 70, "loss": 0.2453, "lr": 6.030737921409169e-07, "epoch": 6.0, "percentage": 90.0, "elapsed_time": "1:01:16", "remaining_time": "0:06:48"}
|
| 64 |
+
{"current_steps": 64, "total_steps": 70, "loss": 0.2161, "lr": 4.4427194213859216e-07, "epoch": 6.095238095238095, "percentage": 91.43, "elapsed_time": "1:03:59", "remaining_time": "0:05:59"}
|
| 65 |
+
{"current_steps": 65, "total_steps": 70, "loss": 0.1761, "lr": 3.0922713770922155e-07, "epoch": 6.190476190476191, "percentage": 92.86, "elapsed_time": "1:04:47", "remaining_time": "0:04:59"}
|
| 66 |
+
{"current_steps": 66, "total_steps": 70, "loss": 0.1877, "lr": 1.9827512151456175e-07, "epoch": 6.285714285714286, "percentage": 94.29, "elapsed_time": "1:05:26", "remaining_time": "0:03:57"}
|
| 67 |
+
{"current_steps": 67, "total_steps": 70, "loss": 0.223, "lr": 1.1169173774871478e-07, "epoch": 6.380952380952381, "percentage": 95.71, "elapsed_time": "1:06:08", "remaining_time": "0:02:57"}
|
| 68 |
+
{"current_steps": 68, "total_steps": 70, "loss": 0.2255, "lr": 4.9692246345985905e-08, "epoch": 6.476190476190476, "percentage": 97.14, "elapsed_time": "1:06:55", "remaining_time": "0:01:58"}
|
| 69 |
+
{"current_steps": 69, "total_steps": 70, "loss": 0.2008, "lr": 1.2430787810776556e-08, "epoch": 6.571428571428571, "percentage": 98.57, "elapsed_time": "1:07:42", "remaining_time": "0:00:58"}
|
| 70 |
+
{"current_steps": 70, "total_steps": 70, "loss": 0.2137, "lr": 0.0, "epoch": 6.666666666666667, "percentage": 100.0, "elapsed_time": "1:08:21", "remaining_time": "0:00:00"}
|
| 71 |
+
{"current_steps": 70, "total_steps": 70, "epoch": 6.666666666666667, "percentage": 100.0, "elapsed_time": "1:13:54", "remaining_time": "0:00:00"}
|