Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e1f812cb2baefb2f9e5931822ac4ca348415efadb75bf52b17417eec7cca99b0
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:072f934323edbeddb17aeac5672dcaf8051f58c1b19ce7ccabbbfc1fc411afa3
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9d416ded1a38e27bd0316164e5e5122428651f8367044de25dc19d7d264eeac8
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:28acbad9b36b9454b383695edcc7b4e40156b0d2bf991a9a80a96de19c8a48f0
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -45,3 +45,26 @@
|
|
| 45 |
{"current_steps": 45, "total_steps": 69, "loss": 0.4696, "lr": 1.3053894943103598e-05, "epoch": 1.9253333333333333, "percentage": 65.22, "elapsed_time": "1:35:57", "remaining_time": "0:51:10"}
|
| 46 |
{"current_steps": 46, "total_steps": 69, "loss": 0.4505, "lr": 1.2112882897733634e-05, "epoch": 1.968, "percentage": 66.67, "elapsed_time": "1:38:10", "remaining_time": "0:49:05"}
|
| 47 |
{"current_steps": 47, "total_steps": 69, "loss": 0.7496, "lr": 1.1192116968847313e-05, "epoch": 2.016, "percentage": 68.12, "elapsed_time": "1:41:22", "remaining_time": "0:47:27"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 45 |
{"current_steps": 45, "total_steps": 69, "loss": 0.4696, "lr": 1.3053894943103598e-05, "epoch": 1.9253333333333333, "percentage": 65.22, "elapsed_time": "1:35:57", "remaining_time": "0:51:10"}
|
| 46 |
{"current_steps": 46, "total_steps": 69, "loss": 0.4505, "lr": 1.2112882897733634e-05, "epoch": 1.968, "percentage": 66.67, "elapsed_time": "1:38:10", "remaining_time": "0:49:05"}
|
| 47 |
{"current_steps": 47, "total_steps": 69, "loss": 0.7496, "lr": 1.1192116968847313e-05, "epoch": 2.016, "percentage": 68.12, "elapsed_time": "1:41:22", "remaining_time": "0:47:27"}
|
| 48 |
+
{"current_steps": 48, "total_steps": 69, "loss": 0.3822, "lr": 1.0293960749378384e-05, "epoch": 2.058666666666667, "percentage": 69.57, "elapsed_time": "1:43:26", "remaining_time": "0:45:15"}
|
| 49 |
+
{"current_steps": 49, "total_steps": 69, "loss": 0.4408, "lr": 9.420719793460758e-06, "epoch": 2.1013333333333333, "percentage": 71.01, "elapsed_time": "1:45:37", "remaining_time": "0:43:06"}
|
| 50 |
+
{"current_steps": 50, "total_steps": 69, "loss": 0.399, "lr": 8.57463569810415e-06, "epoch": 2.144, "percentage": 72.46, "elapsed_time": "1:47:39", "remaining_time": "0:40:54"}
|
| 51 |
+
{"current_steps": 51, "total_steps": 69, "loss": 0.4757, "lr": 7.757880349046742e-06, "epoch": 2.1866666666666665, "percentage": 73.91, "elapsed_time": "1:49:50", "remaining_time": "0:38:46"}
|
| 52 |
+
{"current_steps": 52, "total_steps": 69, "loss": 0.3849, "lr": 6.97255034555556e-06, "epoch": 2.2293333333333334, "percentage": 75.36, "elapsed_time": "1:51:44", "remaining_time": "0:36:31"}
|
| 53 |
+
{"current_steps": 53, "total_steps": 69, "loss": 0.4188, "lr": 6.220661618486268e-06, "epoch": 2.2720000000000002, "percentage": 76.81, "elapsed_time": "1:53:44", "remaining_time": "0:34:20"}
|
| 54 |
+
{"current_steps": 54, "total_steps": 69, "loss": 0.4086, "lr": 5.504144255417605e-06, "epoch": 2.3146666666666667, "percentage": 78.26, "elapsed_time": "1:55:46", "remaining_time": "0:32:09"}
|
| 55 |
+
{"current_steps": 55, "total_steps": 69, "loss": 0.4171, "lr": 4.824837546144183e-06, "epoch": 2.3573333333333335, "percentage": 79.71, "elapsed_time": "1:57:44", "remaining_time": "0:29:58"}
|
| 56 |
+
{"current_steps": 56, "total_steps": 69, "loss": 0.4112, "lr": 4.184485261246032e-06, "epoch": 2.4, "percentage": 81.16, "elapsed_time": "1:59:51", "remaining_time": "0:27:49"}
|
| 57 |
+
{"current_steps": 57, "total_steps": 69, "loss": 0.3784, "lr": 3.584731175854479e-06, "epoch": 2.4426666666666668, "percentage": 82.61, "elapsed_time": "2:01:49", "remaining_time": "0:25:38"}
|
| 58 |
+
{"current_steps": 58, "total_steps": 69, "loss": 0.407, "lr": 3.0271148501049796e-06, "epoch": 2.485333333333333, "percentage": 84.06, "elapsed_time": "2:04:05", "remaining_time": "0:23:32"}
|
| 59 |
+
{"current_steps": 59, "total_steps": 69, "loss": 0.4113, "lr": 2.5130676771083585e-06, "epoch": 2.528, "percentage": 85.51, "elapsed_time": "2:06:18", "remaining_time": "0:21:24"}
|
| 60 |
+
{"current_steps": 60, "total_steps": 69, "loss": 0.3725, "lr": 2.0439092085851685e-06, "epoch": 2.570666666666667, "percentage": 86.96, "elapsed_time": "2:08:25", "remaining_time": "0:19:15"}
|
| 61 |
+
{"current_steps": 61, "total_steps": 69, "loss": 0.3891, "lr": 1.620843767595388e-06, "epoch": 2.6133333333333333, "percentage": 88.41, "elapsed_time": "2:10:22", "remaining_time": "0:17:05"}
|
| 62 |
+
{"current_steps": 62, "total_steps": 69, "loss": 0.3877, "lr": 1.244957357058394e-06, "epoch": 2.656, "percentage": 89.86, "elapsed_time": "2:12:19", "remaining_time": "0:14:56"}
|
| 63 |
+
{"current_steps": 63, "total_steps": 69, "loss": 0.3701, "lr": 9.172148719990237e-07, "epoch": 2.6986666666666665, "percentage": 91.3, "elapsed_time": "2:14:10", "remaining_time": "0:12:46"}
|
| 64 |
+
{"current_steps": 64, "total_steps": 69, "loss": 0.4496, "lr": 6.384576226759165e-07, "epoch": 2.7413333333333334, "percentage": 92.75, "elapsed_time": "2:16:16", "remaining_time": "0:10:38"}
|
| 65 |
+
{"current_steps": 65, "total_steps": 69, "loss": 0.3378, "lr": 4.094011749501103e-07, "epoch": 2.784, "percentage": 94.2, "elapsed_time": "2:18:08", "remaining_time": "0:08:30"}
|
| 66 |
+
{"current_steps": 66, "total_steps": 69, "loss": 0.4265, "lr": 2.3063351343777241e-07, "epoch": 2.8266666666666667, "percentage": 95.65, "elapsed_time": "2:20:20", "remaining_time": "0:06:22"}
|
| 67 |
+
{"current_steps": 67, "total_steps": 69, "loss": 0.385, "lr": 1.0261353216209691e-07, "epoch": 2.8693333333333335, "percentage": 97.1, "elapsed_time": "2:22:22", "remaining_time": "0:04:14"}
|
| 68 |
+
{"current_steps": 68, "total_steps": 69, "loss": 0.4118, "lr": 2.566985657894483e-08, "epoch": 2.912, "percentage": 98.55, "elapsed_time": "2:24:24", "remaining_time": "0:02:07"}
|
| 69 |
+
{"current_steps": 69, "total_steps": 69, "loss": 0.4309, "lr": 0.0, "epoch": 2.9546666666666668, "percentage": 100.0, "elapsed_time": "2:26:55", "remaining_time": "0:00:00"}
|
| 70 |
+
{"current_steps": 69, "total_steps": 69, "epoch": 2.9546666666666668, "percentage": 100.0, "elapsed_time": "2:29:12", "remaining_time": "0:00:00"}
|