Training in progress, epoch 4
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e9e04223a6687bf7fdcfdbbe17cbe9fe106cb8b95be27f96cb60d371cbcc5d60
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:baf6cf193c9acac175f00684e128a834b45c01bd9dd5cb49f4a82ffc2066182f
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:56d037ab17f1b97694fae20771f34532e17ff58b6d63ec8cafc5f6b50d163a1d
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1a0b899e917afbb09e6ad8818ccd2e3fe9e88df5a87082ca4cd84f25b1c80067
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -36,3 +36,34 @@
|
|
| 36 |
{"current_steps": 36, "total_steps": 117, "loss": 0.3401, "lr": 8.765357330018056e-06, "epoch": 3.759493670886076, "percentage": 30.77, "elapsed_time": "0:14:29", "remaining_time": "0:32:36"}
|
| 37 |
{"current_steps": 37, "total_steps": 117, "loss": 0.3731, "lr": 8.665259359149132e-06, "epoch": 3.8607594936708862, "percentage": 31.62, "elapsed_time": "0:14:52", "remaining_time": "0:32:09"}
|
| 38 |
{"current_steps": 38, "total_steps": 117, "loss": 0.3556, "lr": 8.561880484756726e-06, "epoch": 3.962025316455696, "percentage": 32.48, "elapsed_time": "0:15:17", "remaining_time": "0:31:47"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 36 |
{"current_steps": 36, "total_steps": 117, "loss": 0.3401, "lr": 8.765357330018056e-06, "epoch": 3.759493670886076, "percentage": 30.77, "elapsed_time": "0:14:29", "remaining_time": "0:32:36"}
|
| 37 |
{"current_steps": 37, "total_steps": 117, "loss": 0.3731, "lr": 8.665259359149132e-06, "epoch": 3.8607594936708862, "percentage": 31.62, "elapsed_time": "0:14:52", "remaining_time": "0:32:09"}
|
| 38 |
{"current_steps": 38, "total_steps": 117, "loss": 0.3556, "lr": 8.561880484756726e-06, "epoch": 3.962025316455696, "percentage": 32.48, "elapsed_time": "0:15:17", "remaining_time": "0:31:47"}
|
| 39 |
+
{"current_steps": 39, "total_steps": 117, "loss": 0.3495, "lr": 8.455313244934324e-06, "epoch": 4.10126582278481, "percentage": 33.33, "elapsed_time": "0:16:21", "remaining_time": "0:32:42"}
|
| 40 |
+
{"current_steps": 40, "total_steps": 117, "loss": 0.2985, "lr": 8.345653031794292e-06, "epoch": 4.2025316455696204, "percentage": 34.19, "elapsed_time": "0:16:42", "remaining_time": "0:32:09"}
|
| 41 |
+
{"current_steps": 41, "total_steps": 117, "loss": 0.3125, "lr": 8.232998006078998e-06, "epoch": 4.30379746835443, "percentage": 35.04, "elapsed_time": "0:16:57", "remaining_time": "0:31:25"}
|
| 42 |
+
{"current_steps": 42, "total_steps": 117, "loss": 0.2084, "lr": 8.117449009293668e-06, "epoch": 4.405063291139241, "percentage": 35.9, "elapsed_time": "0:17:17", "remaining_time": "0:30:52"}
|
| 43 |
+
{"current_steps": 43, "total_steps": 117, "loss": 0.2719, "lr": 7.99910947343957e-06, "epoch": 4.506329113924051, "percentage": 36.75, "elapsed_time": "0:17:41", "remaining_time": "0:30:26"}
|
| 44 |
+
{"current_steps": 44, "total_steps": 117, "loss": 0.2179, "lr": 7.87808532842837e-06, "epoch": 4.6075949367088604, "percentage": 37.61, "elapsed_time": "0:17:56", "remaining_time": "0:29:46"}
|
| 45 |
+
{"current_steps": 45, "total_steps": 117, "loss": 0.2132, "lr": 7.754484907260513e-06, "epoch": 4.708860759493671, "percentage": 38.46, "elapsed_time": "0:18:14", "remaining_time": "0:29:10"}
|
| 46 |
+
{"current_steps": 46, "total_steps": 117, "loss": 0.2101, "lr": 7.628418849052523e-06, "epoch": 4.810126582278481, "percentage": 39.32, "elapsed_time": "0:18:30", "remaining_time": "0:28:33"}
|
| 47 |
+
{"current_steps": 47, "total_steps": 117, "loss": 0.2558, "lr": 7.500000000000001e-06, "epoch": 4.911392405063291, "percentage": 40.17, "elapsed_time": "0:18:57", "remaining_time": "0:28:14"}
|
| 48 |
+
{"current_steps": 48, "total_steps": 117, "loss": 0.2486, "lr": 7.369343312364994e-06, "epoch": 5.050632911392405, "percentage": 41.03, "elapsed_time": "0:20:11", "remaining_time": "0:29:01"}
|
| 49 |
+
{"current_steps": 49, "total_steps": 117, "loss": 0.1955, "lr": 7.236565741578163e-06, "epoch": 5.151898734177215, "percentage": 41.88, "elapsed_time": "0:20:30", "remaining_time": "0:28:28"}
|
| 50 |
+
{"current_steps": 50, "total_steps": 117, "loss": 0.186, "lr": 7.101786141547829e-06, "epoch": 5.253164556962025, "percentage": 42.74, "elapsed_time": "0:20:55", "remaining_time": "0:28:01"}
|
| 51 |
+
{"current_steps": 51, "total_steps": 117, "loss": 0.2063, "lr": 6.965125158269619e-06, "epoch": 5.3544303797468356, "percentage": 43.59, "elapsed_time": "0:21:16", "remaining_time": "0:27:31"}
|
| 52 |
+
{"current_steps": 52, "total_steps": 117, "loss": 0.1844, "lr": 6.8267051218319766e-06, "epoch": 5.455696202531645, "percentage": 44.44, "elapsed_time": "0:21:39", "remaining_time": "0:27:04"}
|
| 53 |
+
{"current_steps": 53, "total_steps": 117, "loss": 0.2212, "lr": 6.686649936914151e-06, "epoch": 5.556962025316456, "percentage": 45.3, "elapsed_time": "0:22:00", "remaining_time": "0:26:34"}
|
| 54 |
+
{"current_steps": 54, "total_steps": 117, "loss": 0.2044, "lr": 6.545084971874738e-06, "epoch": 5.658227848101266, "percentage": 46.15, "elapsed_time": "0:22:26", "remaining_time": "0:26:10"}
|
| 55 |
+
{"current_steps": 55, "total_steps": 117, "loss": 0.158, "lr": 6.402136946530014e-06, "epoch": 5.759493670886076, "percentage": 47.01, "elapsed_time": "0:22:44", "remaining_time": "0:25:38"}
|
| 56 |
+
{"current_steps": 56, "total_steps": 117, "loss": 0.2431, "lr": 6.257933818722544e-06, "epoch": 5.860759493670886, "percentage": 47.86, "elapsed_time": "0:23:04", "remaining_time": "0:25:08"}
|
| 57 |
+
{"current_steps": 57, "total_steps": 117, "loss": 0.2224, "lr": 6.112604669781572e-06, "epoch": 5.962025316455696, "percentage": 48.72, "elapsed_time": "0:23:25", "remaining_time": "0:24:39"}
|
| 58 |
+
{"current_steps": 58, "total_steps": 117, "loss": 0.1807, "lr": 5.9662795889777666e-06, "epoch": 6.10126582278481, "percentage": 49.57, "elapsed_time": "0:24:41", "remaining_time": "0:25:07"}
|
| 59 |
+
{"current_steps": 59, "total_steps": 117, "loss": 0.1659, "lr": 5.819089557075689e-06, "epoch": 6.2025316455696204, "percentage": 50.43, "elapsed_time": "0:25:02", "remaining_time": "0:24:36"}
|
| 60 |
+
{"current_steps": 60, "total_steps": 117, "loss": 0.1562, "lr": 5.671166329088278e-06, "epoch": 6.30379746835443, "percentage": 51.28, "elapsed_time": "0:25:24", "remaining_time": "0:24:08"}
|
| 61 |
+
{"current_steps": 61, "total_steps": 117, "loss": 0.0946, "lr": 5.522642316338268e-06, "epoch": 6.405063291139241, "percentage": 52.14, "elapsed_time": "0:25:37", "remaining_time": "0:23:31"}
|
| 62 |
+
{"current_steps": 62, "total_steps": 117, "loss": 0.1981, "lr": 5.373650467932122e-06, "epoch": 6.506329113924051, "percentage": 52.99, "elapsed_time": "0:25:59", "remaining_time": "0:23:03"}
|
| 63 |
+
{"current_steps": 63, "total_steps": 117, "loss": 0.1124, "lr": 5.224324151752575e-06, "epoch": 6.6075949367088604, "percentage": 53.85, "elapsed_time": "0:26:15", "remaining_time": "0:22:30"}
|
| 64 |
+
{"current_steps": 64, "total_steps": 117, "loss": 0.1542, "lr": 5.074797035076319e-06, "epoch": 6.708860759493671, "percentage": 54.7, "elapsed_time": "0:26:32", "remaining_time": "0:21:58"}
|
| 65 |
+
{"current_steps": 65, "total_steps": 117, "loss": 0.1885, "lr": 4.9252029649236835e-06, "epoch": 6.810126582278481, "percentage": 55.56, "elapsed_time": "0:27:01", "remaining_time": "0:21:36"}
|
| 66 |
+
{"current_steps": 66, "total_steps": 117, "loss": 0.129, "lr": 4.775675848247427e-06, "epoch": 6.911392405063291, "percentage": 56.41, "elapsed_time": "0:27:21", "remaining_time": "0:21:08"}
|
| 67 |
+
{"current_steps": 67, "total_steps": 117, "loss": 0.0944, "lr": 4.626349532067879e-06, "epoch": 7.050632911392405, "percentage": 57.26, "elapsed_time": "0:28:29", "remaining_time": "0:21:15"}
|
| 68 |
+
{"current_steps": 68, "total_steps": 117, "loss": 0.1655, "lr": 4.477357683661734e-06, "epoch": 7.151898734177215, "percentage": 58.12, "elapsed_time": "0:28:59", "remaining_time": "0:20:53"}
|
| 69 |
+
{"current_steps": 69, "total_steps": 117, "loss": 0.081, "lr": 4.3288336709117246e-06, "epoch": 7.253164556962025, "percentage": 58.97, "elapsed_time": "0:29:13", "remaining_time": "0:20:20"}
|