Training in progress, step 14
Browse files- model-00001-of-00004.safetensors +1 -1
- model-00002-of-00004.safetensors +1 -1
- model-00003-of-00004.safetensors +1 -1
- model-00004-of-00004.safetensors +1 -1
- trainer_log.jsonl +15 -15
- training_args.bin +1 -1
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b109edb65db33ea41d84de2e6da4eadf0a60e181c6784b8cc788958841ce58ae
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f7110eae4f21fd28da975252d2e5a987220e9c480ac7e48868717e7e56f3b6b
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:216bac96ffb270d9f00fac634f79b36d337d7e96fdd3bb936e3a31994468f2f8
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d65cd8d169dc0ffdb9a0d698df37e775c102c4296a8124b1e098c85456b3788
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -1,15 +1,15 @@
|
|
| 1 |
-
{"current_steps": 1, "total_steps": 14, "loss": 1.3139, "lr": 0.0, "epoch": 0.12631578947368421, "percentage": 7.14, "elapsed_time": "0:00:27", "remaining_time": "0:05:
|
| 2 |
-
{"current_steps": 2, "total_steps": 14, "loss": 1.3348, "lr": 5e-06, "epoch": 0.25263157894736843, "percentage": 14.29, "elapsed_time": "0:00:45", "remaining_time": "0:04:
|
| 3 |
-
{"current_steps": 3, "total_steps": 14, "loss": 1.
|
| 4 |
-
{"current_steps": 4, "total_steps": 14, "loss": 1.
|
| 5 |
-
{"current_steps": 5, "total_steps": 14, "loss": 1.
|
| 6 |
-
{"current_steps": 6, "total_steps": 14, "loss": 1.
|
| 7 |
-
{"current_steps": 7, "total_steps": 14, "loss": 1.
|
| 8 |
-
{"current_steps": 8, "total_steps": 14, "loss": 2.
|
| 9 |
-
{"current_steps": 9, "total_steps": 14, "loss": 1.
|
| 10 |
-
{"current_steps": 10, "total_steps": 14, "loss": 0.
|
| 11 |
-
{"current_steps": 11, "total_steps": 14, "loss": 0.9933, "lr": 2.5000000000000015e-06, "epoch": 1.5052631578947369, "percentage": 78.57, "elapsed_time": "0:
|
| 12 |
-
{"current_steps": 12, "total_steps": 14, "loss": 1.
|
| 13 |
-
{"current_steps": 13, "total_steps": 14, "loss": 1.
|
| 14 |
-
{"current_steps": 14, "total_steps": 14, "loss": 0.
|
| 15 |
-
{"current_steps": 14, "total_steps": 14, "epoch": 1.8842105263157896, "percentage": 100.0, "elapsed_time": "0:06:
|
|
|
|
| 1 |
+
{"current_steps": 1, "total_steps": 14, "loss": 1.3139, "lr": 0.0, "epoch": 0.12631578947368421, "percentage": 7.14, "elapsed_time": "0:00:27", "remaining_time": "0:05:51"}
|
| 2 |
+
{"current_steps": 2, "total_steps": 14, "loss": 1.3348, "lr": 5e-06, "epoch": 0.25263157894736843, "percentage": 14.29, "elapsed_time": "0:00:45", "remaining_time": "0:04:32"}
|
| 3 |
+
{"current_steps": 3, "total_steps": 14, "loss": 1.2368, "lr": 1e-05, "epoch": 0.37894736842105264, "percentage": 21.43, "elapsed_time": "0:01:07", "remaining_time": "0:04:07"}
|
| 4 |
+
{"current_steps": 4, "total_steps": 14, "loss": 1.1371, "lr": 9.829629131445342e-06, "epoch": 0.5052631578947369, "percentage": 28.57, "elapsed_time": "0:01:24", "remaining_time": "0:03:30"}
|
| 5 |
+
{"current_steps": 5, "total_steps": 14, "loss": 1.1389, "lr": 9.330127018922195e-06, "epoch": 0.631578947368421, "percentage": 35.71, "elapsed_time": "0:01:43", "remaining_time": "0:03:05"}
|
| 6 |
+
{"current_steps": 6, "total_steps": 14, "loss": 1.066, "lr": 8.535533905932739e-06, "epoch": 0.7578947368421053, "percentage": 42.86, "elapsed_time": "0:02:05", "remaining_time": "0:02:46"}
|
| 7 |
+
{"current_steps": 7, "total_steps": 14, "loss": 1.1584, "lr": 7.500000000000001e-06, "epoch": 0.8842105263157894, "percentage": 50.0, "elapsed_time": "0:02:25", "remaining_time": "0:02:25"}
|
| 8 |
+
{"current_steps": 8, "total_steps": 14, "loss": 2.098, "lr": 6.294095225512604e-06, "epoch": 1.1263157894736842, "percentage": 57.14, "elapsed_time": "0:03:03", "remaining_time": "0:02:17"}
|
| 9 |
+
{"current_steps": 9, "total_steps": 14, "loss": 1.0779, "lr": 5e-06, "epoch": 1.2526315789473683, "percentage": 64.29, "elapsed_time": "0:03:24", "remaining_time": "0:01:53"}
|
| 10 |
+
{"current_steps": 10, "total_steps": 14, "loss": 0.9586, "lr": 3.705904774487396e-06, "epoch": 1.3789473684210527, "percentage": 71.43, "elapsed_time": "0:03:41", "remaining_time": "0:01:28"}
|
| 11 |
+
{"current_steps": 11, "total_steps": 14, "loss": 0.9933, "lr": 2.5000000000000015e-06, "epoch": 1.5052631578947369, "percentage": 78.57, "elapsed_time": "0:03:59", "remaining_time": "0:01:05"}
|
| 12 |
+
{"current_steps": 12, "total_steps": 14, "loss": 1.0243, "lr": 1.4644660940672628e-06, "epoch": 1.631578947368421, "percentage": 85.71, "elapsed_time": "0:04:17", "remaining_time": "0:00:42"}
|
| 13 |
+
{"current_steps": 13, "total_steps": 14, "loss": 1.0271, "lr": 6.698729810778065e-07, "epoch": 1.7578947368421054, "percentage": 92.86, "elapsed_time": "0:04:37", "remaining_time": "0:00:21"}
|
| 14 |
+
{"current_steps": 14, "total_steps": 14, "loss": 0.94, "lr": 1.7037086855465902e-07, "epoch": 1.8842105263157896, "percentage": 100.0, "elapsed_time": "0:04:58", "remaining_time": "0:00:00"}
|
| 15 |
+
{"current_steps": 14, "total_steps": 14, "epoch": 1.8842105263157896, "percentage": 100.0, "elapsed_time": "0:06:06", "remaining_time": "0:00:00"}
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 7800
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bded2ee1a3e4a6652222eb0c7478a16ce64b03d52a10847551afbccd9a96bf4b
|
| 3 |
size 7800
|