Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14dcd3faec9b3e627bec90c775a2820035a9815985f0c9ea7f527ffb8044d6b9
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4b6c4c297dfb691cec0fa1e1bbfe1ff423719f6c3a235c6f789b781cd29d1825
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5fe6e62cece3520992478d058f61e6b18b98a77dde4ba2140819a8229154af3f
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d28395a5f22becae37590f334d1dc2edbfe5c69a4b58815de13f8c19d7f8eaaa
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -23,3 +23,9 @@
|
|
| 23 |
{"current_steps": 23, "total_steps": 30, "loss": 0.6867, "lr": 1.5687918106563326e-06, "epoch": 2.1904761904761907, "percentage": 76.67, "elapsed_time": "0:17:04", "remaining_time": "0:05:11"}
|
| 24 |
{"current_steps": 24, "total_steps": 30, "loss": 0.7337, "lr": 1.1697777844051105e-06, "epoch": 2.2857142857142856, "percentage": 80.0, "elapsed_time": "0:17:37", "remaining_time": "0:04:24"}
|
| 25 |
{"current_steps": 25, "total_steps": 30, "loss": 0.8412, "lr": 8.225609429353187e-07, "epoch": 2.380952380952381, "percentage": 83.33, "elapsed_time": "0:18:25", "remaining_time": "0:03:41"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 23 |
{"current_steps": 23, "total_steps": 30, "loss": 0.6867, "lr": 1.5687918106563326e-06, "epoch": 2.1904761904761907, "percentage": 76.67, "elapsed_time": "0:17:04", "remaining_time": "0:05:11"}
|
| 24 |
{"current_steps": 24, "total_steps": 30, "loss": 0.7337, "lr": 1.1697777844051105e-06, "epoch": 2.2857142857142856, "percentage": 80.0, "elapsed_time": "0:17:37", "remaining_time": "0:04:24"}
|
| 25 |
{"current_steps": 25, "total_steps": 30, "loss": 0.8412, "lr": 8.225609429353187e-07, "epoch": 2.380952380952381, "percentage": 83.33, "elapsed_time": "0:18:25", "remaining_time": "0:03:41"}
|
| 26 |
+
{"current_steps": 26, "total_steps": 30, "loss": 0.7219, "lr": 5.318367983829393e-07, "epoch": 2.4761904761904763, "percentage": 86.67, "elapsed_time": "0:19:00", "remaining_time": "0:02:55"}
|
| 27 |
+
{"current_steps": 27, "total_steps": 30, "loss": 0.7787, "lr": 3.015368960704584e-07, "epoch": 2.571428571428571, "percentage": 90.0, "elapsed_time": "0:19:49", "remaining_time": "0:02:12"}
|
| 28 |
+
{"current_steps": 28, "total_steps": 30, "loss": 0.8023, "lr": 1.3477564710088097e-07, "epoch": 2.6666666666666665, "percentage": 93.33, "elapsed_time": "0:20:25", "remaining_time": "0:01:27"}
|
| 29 |
+
{"current_steps": 29, "total_steps": 30, "loss": 0.7005, "lr": 3.3808211290284886e-08, "epoch": 2.761904761904762, "percentage": 96.67, "elapsed_time": "0:21:00", "remaining_time": "0:00:43"}
|
| 30 |
+
{"current_steps": 30, "total_steps": 30, "loss": 0.7909, "lr": 0.0, "epoch": 2.857142857142857, "percentage": 100.0, "elapsed_time": "0:21:50", "remaining_time": "0:00:00"}
|
| 31 |
+
{"current_steps": 30, "total_steps": 30, "epoch": 2.857142857142857, "percentage": 100.0, "elapsed_time": "0:23:30", "remaining_time": "0:00:00"}
|