Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a303b84070f5c585fec3e860afcc199c8d0cb9200ce1330b95d45c4fd843e9c
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:51169d2bf398480aa6e78672e22ee4466c4185a658afadbeffb83bc9531ab598
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4f45d2c5f626a8672934eacf676d79331a6827b62168fe6d8036cf154baeab91
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0eaf0c6a76b771275b1305d9d7b5d9c7fd2f33a1071727f9943be04cfe9bfbe2
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -16,3 +16,13 @@
|
|
| 16 |
{"current_steps": 16, "total_steps": 117, "loss": 0.5685, "lr": 9.964234631709188e-06, "epoch": 1.6582278481012658, "percentage": 13.68, "elapsed_time": "0:06:38", "remaining_time": "0:41:56"}
|
| 17 |
{"current_steps": 17, "total_steps": 117, "loss": 0.5271, "lr": 9.944154131125643e-06, "epoch": 1.759493670886076, "percentage": 14.53, "elapsed_time": "0:06:55", "remaining_time": "0:40:44"}
|
| 18 |
{"current_steps": 18, "total_steps": 117, "loss": 0.4994, "lr": 9.91964794299315e-06, "epoch": 1.8607594936708862, "percentage": 15.38, "elapsed_time": "0:07:15", "remaining_time": "0:39:53"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 16 |
{"current_steps": 16, "total_steps": 117, "loss": 0.5685, "lr": 9.964234631709188e-06, "epoch": 1.6582278481012658, "percentage": 13.68, "elapsed_time": "0:06:38", "remaining_time": "0:41:56"}
|
| 17 |
{"current_steps": 17, "total_steps": 117, "loss": 0.5271, "lr": 9.944154131125643e-06, "epoch": 1.759493670886076, "percentage": 14.53, "elapsed_time": "0:06:55", "remaining_time": "0:40:44"}
|
| 18 |
{"current_steps": 18, "total_steps": 117, "loss": 0.4994, "lr": 9.91964794299315e-06, "epoch": 1.8607594936708862, "percentage": 15.38, "elapsed_time": "0:07:15", "remaining_time": "0:39:53"}
|
| 19 |
+
{"current_steps": 19, "total_steps": 117, "loss": 0.5071, "lr": 9.890738003669029e-06, "epoch": 1.9620253164556962, "percentage": 16.24, "elapsed_time": "0:07:45", "remaining_time": "0:40:01"}
|
| 20 |
+
{"current_steps": 20, "total_steps": 117, "loss": 0.4746, "lr": 9.857450191464337e-06, "epoch": 2.1012658227848102, "percentage": 17.09, "elapsed_time": "0:08:55", "remaining_time": "0:43:17"}
|
| 21 |
+
{"current_steps": 21, "total_steps": 117, "loss": 0.4618, "lr": 9.819814303479268e-06, "epoch": 2.2025316455696204, "percentage": 17.95, "elapsed_time": "0:09:24", "remaining_time": "0:43:02"}
|
| 22 |
+
{"current_steps": 22, "total_steps": 117, "loss": 0.4508, "lr": 9.777864028930705e-06, "epoch": 2.3037974683544302, "percentage": 18.8, "elapsed_time": "0:09:52", "remaining_time": "0:42:39"}
|
| 23 |
+
{"current_steps": 23, "total_steps": 117, "loss": 0.3964, "lr": 9.731636918995821e-06, "epoch": 2.4050632911392404, "percentage": 19.66, "elapsed_time": "0:10:09", "remaining_time": "0:41:29"}
|
| 24 |
+
{"current_steps": 24, "total_steps": 117, "loss": 0.4052, "lr": 9.681174353198687e-06, "epoch": 2.5063291139240507, "percentage": 20.51, "elapsed_time": "0:10:26", "remaining_time": "0:40:29"}
|
| 25 |
+
{"current_steps": 25, "total_steps": 117, "loss": 0.4393, "lr": 9.626521502369984e-06, "epoch": 2.607594936708861, "percentage": 21.37, "elapsed_time": "0:10:53", "remaining_time": "0:40:05"}
|
| 26 |
+
{"current_steps": 26, "total_steps": 117, "loss": 0.4439, "lr": 9.567727288213005e-06, "epoch": 2.708860759493671, "percentage": 22.22, "elapsed_time": "0:11:13", "remaining_time": "0:39:16"}
|
| 27 |
+
{"current_steps": 27, "total_steps": 117, "loss": 0.3915, "lr": 9.504844339512096e-06, "epoch": 2.810126582278481, "percentage": 23.08, "elapsed_time": "0:11:33", "remaining_time": "0:38:31"}
|
| 28 |
+
{"current_steps": 28, "total_steps": 117, "loss": 0.391, "lr": 9.437928945022772e-06, "epoch": 2.911392405063291, "percentage": 23.93, "elapsed_time": "0:11:50", "remaining_time": "0:37:37"}
|