Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ae8372ba8f6288205de9483178b0accd16a3c7386dfc92e560836c806c59c8cc
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:77511d7d0a6a3e40e347ce893ac93905fcd087968851600b8cfdf25904fc4da7
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:56db0b0c8a64add581633f0ea3dd135310b0556fcbc6d1d09e2149a40cce0dbf
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5c76f4ff81c21082ed12fcc3759c9402a939d6d91a79ce4b24fa76f5b5412d7f
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -52,3 +52,25 @@
|
|
| 52 |
{"current_steps": 52, "total_steps": 75, "loss": 0.8763, "lr": 2.636557474057173e-06, "epoch": 2.0064308681672025, "percentage": 69.33, "elapsed_time": "0:45:08", "remaining_time": "0:19:58"}
|
| 53 |
{"current_steps": 53, "total_steps": 75, "loss": 0.8473, "lr": 2.4326290324257896e-06, "epoch": 2.045016077170418, "percentage": 70.67, "elapsed_time": "0:46:09", "remaining_time": "0:19:09"}
|
| 54 |
{"current_steps": 54, "total_steps": 75, "loss": 0.7919, "lr": 2.234344229374003e-06, "epoch": 2.0836012861736335, "percentage": 72.0, "elapsed_time": "0:47:01", "remaining_time": "0:18:17"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 52 |
{"current_steps": 52, "total_steps": 75, "loss": 0.8763, "lr": 2.636557474057173e-06, "epoch": 2.0064308681672025, "percentage": 69.33, "elapsed_time": "0:45:08", "remaining_time": "0:19:58"}
|
| 53 |
{"current_steps": 53, "total_steps": 75, "loss": 0.8473, "lr": 2.4326290324257896e-06, "epoch": 2.045016077170418, "percentage": 70.67, "elapsed_time": "0:46:09", "remaining_time": "0:19:09"}
|
| 54 |
{"current_steps": 54, "total_steps": 75, "loss": 0.7919, "lr": 2.234344229374003e-06, "epoch": 2.0836012861736335, "percentage": 72.0, "elapsed_time": "0:47:01", "remaining_time": "0:18:17"}
|
| 55 |
+
{"current_steps": 55, "total_steps": 75, "loss": 0.8196, "lr": 2.042138937932388e-06, "epoch": 2.122186495176849, "percentage": 73.33, "elapsed_time": "0:47:50", "remaining_time": "0:17:23"}
|
| 56 |
+
{"current_steps": 56, "total_steps": 75, "loss": 0.7881, "lr": 1.856435667045577e-06, "epoch": 2.1607717041800645, "percentage": 74.67, "elapsed_time": "0:48:34", "remaining_time": "0:16:28"}
|
| 57 |
+
{"current_steps": 57, "total_steps": 75, "loss": 0.8631, "lr": 1.677642632805892e-06, "epoch": 2.19935691318328, "percentage": 76.0, "elapsed_time": "0:49:29", "remaining_time": "0:15:37"}
|
| 58 |
+
{"current_steps": 58, "total_steps": 75, "loss": 0.7746, "lr": 1.5061528611057917e-06, "epoch": 2.237942122186495, "percentage": 77.33, "elapsed_time": "0:50:13", "remaining_time": "0:14:43"}
|
| 59 |
+
{"current_steps": 59, "total_steps": 75, "loss": 0.8119, "lr": 1.3423433236816563e-06, "epoch": 2.2765273311897105, "percentage": 78.67, "elapsed_time": "0:51:06", "remaining_time": "0:13:51"}
|
| 60 |
+
{"current_steps": 60, "total_steps": 75, "loss": 0.8375, "lr": 1.186574109448091e-06, "epoch": 2.315112540192926, "percentage": 80.0, "elapsed_time": "0:51:52", "remaining_time": "0:12:58"}
|
| 61 |
+
{"current_steps": 61, "total_steps": 75, "loss": 0.7619, "lr": 1.0391876329443534e-06, "epoch": 2.3536977491961415, "percentage": 81.33, "elapsed_time": "0:52:36", "remaining_time": "0:12:04"}
|
| 62 |
+
{"current_steps": 62, "total_steps": 75, "loss": 0.8132, "lr": 9.005078816328772e-07, "epoch": 2.392282958199357, "percentage": 82.67, "elapsed_time": "0:53:34", "remaining_time": "0:11:13"}
|
| 63 |
+
{"current_steps": 63, "total_steps": 75, "loss": 0.7784, "lr": 7.708397037045129e-07, "epoch": 2.4308681672025725, "percentage": 84.0, "elapsed_time": "0:54:23", "remaining_time": "0:10:21"}
|
| 64 |
+
{"current_steps": 64, "total_steps": 75, "loss": 0.8832, "lr": 6.50468137956049e-07, "epoch": 2.469453376205788, "percentage": 85.33, "elapsed_time": "0:55:16", "remaining_time": "0:09:29"}
|
| 65 |
+
{"current_steps": 65, "total_steps": 75, "loss": 0.8102, "lr": 5.396577872130676e-07, "epoch": 2.508038585209003, "percentage": 86.67, "elapsed_time": "0:56:07", "remaining_time": "0:08:38"}
|
| 66 |
+
{"current_steps": 66, "total_steps": 75, "loss": 0.7881, "lr": 4.386522366755169e-07, "epoch": 2.5466237942122185, "percentage": 88.0, "elapsed_time": "0:57:00", "remaining_time": "0:07:46"}
|
| 67 |
+
{"current_steps": 67, "total_steps": 75, "loss": 0.8807, "lr": 3.4767351846456744e-07, "epoch": 2.585209003215434, "percentage": 89.33, "elapsed_time": "0:57:53", "remaining_time": "0:06:54"}
|
| 68 |
+
{"current_steps": 68, "total_steps": 75, "loss": 0.7756, "lr": 2.669216235478295e-07, "epoch": 2.6237942122186495, "percentage": 90.67, "elapsed_time": "0:58:42", "remaining_time": "0:06:02"}
|
| 69 |
+
{"current_steps": 69, "total_steps": 75, "loss": 0.8685, "lr": 1.9657406211579966e-07, "epoch": 2.662379421221865, "percentage": 92.0, "elapsed_time": "0:59:29", "remaining_time": "0:05:10"}
|
| 70 |
+
{"current_steps": 70, "total_steps": 75, "loss": 0.7501, "lr": 1.3678547337593494e-07, "epoch": 2.7009646302250805, "percentage": 93.33, "elapsed_time": "1:00:09", "remaining_time": "0:04:17"}
|
| 71 |
+
{"current_steps": 71, "total_steps": 75, "loss": 0.8121, "lr": 8.768728562211948e-08, "epoch": 2.739549839228296, "percentage": 94.67, "elapsed_time": "1:00:59", "remaining_time": "0:03:26"}
|
| 72 |
+
{"current_steps": 72, "total_steps": 75, "loss": 0.7776, "lr": 4.9387427326745287e-08, "epoch": 2.778135048231511, "percentage": 96.0, "elapsed_time": "1:01:41", "remaining_time": "0:02:34"}
|
| 73 |
+
{"current_steps": 73, "total_steps": 75, "loss": 0.8149, "lr": 2.1970089890509527e-08, "epoch": 2.816720257234727, "percentage": 97.33, "elapsed_time": "1:02:33", "remaining_time": "0:01:42"}
|
| 74 |
+
{"current_steps": 74, "total_steps": 75, "loss": 0.8291, "lr": 5.495542571443135e-09, "epoch": 2.855305466237942, "percentage": 98.67, "elapsed_time": "1:03:23", "remaining_time": "0:00:51"}
|
| 75 |
+
{"current_steps": 75, "total_steps": 75, "loss": 0.8268, "lr": 0.0, "epoch": 2.8938906752411575, "percentage": 100.0, "elapsed_time": "1:04:05", "remaining_time": "0:00:00"}
|
| 76 |
+
{"current_steps": 75, "total_steps": 75, "epoch": 2.8938906752411575, "percentage": 100.0, "elapsed_time": "1:06:12", "remaining_time": "0:00:00"}
|