Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4976698672
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b3a0e21f835d20ee9602a0e13df413aedc22a2a520dbf06eac084cf053b39476
|
| 3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4999802720
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f39b3588e51d2e098b0ff554990b4ca72ad1a0b5e110adc39f62645c6a0deb50
|
| 3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915916176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ee5304d913e4cac863e9ba090d781734ffdef6c9cae4c385366422505c4eb58
|
| 3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1168138808
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ede2dd636e3e2795e8b01d3147b5cb8d3df80bfdbc8475a1590d31615dcc9427
|
| 3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
|
@@ -22,3 +22,13 @@
|
|
| 22 |
{"current_steps": 200, "total_steps": 300, "eval_loss": 0.9496641159057617, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:21:26", "remaining_time": "0:10:43"}
|
| 23 |
{"current_steps": 210, "total_steps": 300, "loss": 0.8388, "learning_rate": 5e-06, "epoch": 2.1, "percentage": 70.0, "elapsed_time": "0:24:10", "remaining_time": "0:10:21"}
|
| 24 |
{"current_steps": 220, "total_steps": 300, "loss": 0.8356, "learning_rate": 5e-06, "epoch": 2.2, "percentage": 73.33, "elapsed_time": "0:25:08", "remaining_time": "0:09:08"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 22 |
{"current_steps": 200, "total_steps": 300, "eval_loss": 0.9496641159057617, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:21:26", "remaining_time": "0:10:43"}
|
| 23 |
{"current_steps": 210, "total_steps": 300, "loss": 0.8388, "learning_rate": 5e-06, "epoch": 2.1, "percentage": 70.0, "elapsed_time": "0:24:10", "remaining_time": "0:10:21"}
|
| 24 |
{"current_steps": 220, "total_steps": 300, "loss": 0.8356, "learning_rate": 5e-06, "epoch": 2.2, "percentage": 73.33, "elapsed_time": "0:25:08", "remaining_time": "0:09:08"}
|
| 25 |
+
{"current_steps": 230, "total_steps": 300, "loss": 0.838, "learning_rate": 5e-06, "epoch": 2.3, "percentage": 76.67, "elapsed_time": "0:26:07", "remaining_time": "0:07:57"}
|
| 26 |
+
{"current_steps": 240, "total_steps": 300, "loss": 0.8426, "learning_rate": 5e-06, "epoch": 2.4, "percentage": 80.0, "elapsed_time": "0:27:07", "remaining_time": "0:06:46"}
|
| 27 |
+
{"current_steps": 250, "total_steps": 300, "loss": 0.845, "learning_rate": 5e-06, "epoch": 2.5, "percentage": 83.33, "elapsed_time": "0:28:06", "remaining_time": "0:05:37"}
|
| 28 |
+
{"current_steps": 260, "total_steps": 300, "loss": 0.8307, "learning_rate": 5e-06, "epoch": 2.6, "percentage": 86.67, "elapsed_time": "0:29:05", "remaining_time": "0:04:28"}
|
| 29 |
+
{"current_steps": 270, "total_steps": 300, "loss": 0.8391, "learning_rate": 5e-06, "epoch": 2.7, "percentage": 90.0, "elapsed_time": "0:30:04", "remaining_time": "0:03:20"}
|
| 30 |
+
{"current_steps": 280, "total_steps": 300, "loss": 0.8426, "learning_rate": 5e-06, "epoch": 2.8, "percentage": 93.33, "elapsed_time": "0:31:04", "remaining_time": "0:02:13"}
|
| 31 |
+
{"current_steps": 290, "total_steps": 300, "loss": 0.8447, "learning_rate": 5e-06, "epoch": 2.9, "percentage": 96.67, "elapsed_time": "0:32:03", "remaining_time": "0:01:06"}
|
| 32 |
+
{"current_steps": 300, "total_steps": 300, "loss": 0.841, "learning_rate": 5e-06, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:33:02", "remaining_time": "0:00:00"}
|
| 33 |
+
{"current_steps": 300, "total_steps": 300, "eval_loss": 0.9554556012153625, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:34:47", "remaining_time": "0:00:00"}
|
| 34 |
+
{"current_steps": 300, "total_steps": 300, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:36:23", "remaining_time": "0:00:00"}
|