Training in progress, epoch 2, checkpoint
Browse files
checkpoint-5518/trainer_state.json
CHANGED
|
@@ -27,9 +27,9 @@
|
|
| 27 |
"epoch": 0.36258158085569253,
|
| 28 |
"eval_cosine_accuracy": 0.9711852073669434,
|
| 29 |
"eval_loss": 0.3902958035469055,
|
| 30 |
-
"eval_runtime": 34.
|
| 31 |
-
"eval_samples_per_second":
|
| 32 |
-
"eval_steps_per_second": 1.
|
| 33 |
"step": 1000
|
| 34 |
},
|
| 35 |
{
|
|
@@ -43,9 +43,9 @@
|
|
| 43 |
"epoch": 0.7251631617113851,
|
| 44 |
"eval_cosine_accuracy": 0.9699232578277588,
|
| 45 |
"eval_loss": 0.37875595688819885,
|
| 46 |
-
"eval_runtime":
|
| 47 |
-
"eval_samples_per_second":
|
| 48 |
-
"eval_steps_per_second": 1.
|
| 49 |
"step": 2000
|
| 50 |
},
|
| 51 |
{
|
|
@@ -59,9 +59,9 @@
|
|
| 59 |
"epoch": 1.0876811594202898,
|
| 60 |
"eval_cosine_accuracy": 0.9716058373451233,
|
| 61 |
"eval_loss": 0.3854234516620636,
|
| 62 |
-
"eval_runtime": 34.
|
| 63 |
-
"eval_samples_per_second":
|
| 64 |
-
"eval_steps_per_second": 1.
|
| 65 |
"step": 3000
|
| 66 |
},
|
| 67 |
{
|
|
@@ -75,9 +75,9 @@
|
|
| 75 |
"epoch": 1.45,
|
| 76 |
"eval_cosine_accuracy": 0.9708697199821472,
|
| 77 |
"eval_loss": 0.3814031183719635,
|
| 78 |
-
"eval_runtime":
|
| 79 |
-
"eval_samples_per_second":
|
| 80 |
-
"eval_steps_per_second": 1.
|
| 81 |
"step": 4000
|
| 82 |
},
|
| 83 |
{
|
|
@@ -91,9 +91,9 @@
|
|
| 91 |
"epoch": 1.8123188405797102,
|
| 92 |
"eval_cosine_accuracy": 0.9710800051689148,
|
| 93 |
"eval_loss": 0.38102903962135315,
|
| 94 |
-
"eval_runtime":
|
| 95 |
-
"eval_samples_per_second":
|
| 96 |
-
"eval_steps_per_second": 1.
|
| 97 |
"step": 5000
|
| 98 |
}
|
| 99 |
],
|
|
|
|
| 27 |
"epoch": 0.36258158085569253,
|
| 28 |
"eval_cosine_accuracy": 0.9711852073669434,
|
| 29 |
"eval_loss": 0.3902958035469055,
|
| 30 |
+
"eval_runtime": 34.6603,
|
| 31 |
+
"eval_samples_per_second": 274.348,
|
| 32 |
+
"eval_steps_per_second": 1.096,
|
| 33 |
"step": 1000
|
| 34 |
},
|
| 35 |
{
|
|
|
|
| 43 |
"epoch": 0.7251631617113851,
|
| 44 |
"eval_cosine_accuracy": 0.9699232578277588,
|
| 45 |
"eval_loss": 0.37875595688819885,
|
| 46 |
+
"eval_runtime": 33.7082,
|
| 47 |
+
"eval_samples_per_second": 282.098,
|
| 48 |
+
"eval_steps_per_second": 1.127,
|
| 49 |
"step": 2000
|
| 50 |
},
|
| 51 |
{
|
|
|
|
| 59 |
"epoch": 1.0876811594202898,
|
| 60 |
"eval_cosine_accuracy": 0.9716058373451233,
|
| 61 |
"eval_loss": 0.3854234516620636,
|
| 62 |
+
"eval_runtime": 34.2421,
|
| 63 |
+
"eval_samples_per_second": 277.699,
|
| 64 |
+
"eval_steps_per_second": 1.11,
|
| 65 |
"step": 3000
|
| 66 |
},
|
| 67 |
{
|
|
|
|
| 75 |
"epoch": 1.45,
|
| 76 |
"eval_cosine_accuracy": 0.9708697199821472,
|
| 77 |
"eval_loss": 0.3814031183719635,
|
| 78 |
+
"eval_runtime": 33.9647,
|
| 79 |
+
"eval_samples_per_second": 279.967,
|
| 80 |
+
"eval_steps_per_second": 1.119,
|
| 81 |
"step": 4000
|
| 82 |
},
|
| 83 |
{
|
|
|
|
| 91 |
"epoch": 1.8123188405797102,
|
| 92 |
"eval_cosine_accuracy": 0.9710800051689148,
|
| 93 |
"eval_loss": 0.38102903962135315,
|
| 94 |
+
"eval_runtime": 34.858,
|
| 95 |
+
"eval_samples_per_second": 272.792,
|
| 96 |
+
"eval_steps_per_second": 1.09,
|
| 97 |
"step": 5000
|
| 98 |
}
|
| 99 |
],
|
checkpoint-5518/training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5752
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:98354e6a6ec8411cdce0c11c2d3311243c8acedb0b90e2b2c87806e8519cdf4b
|
| 3 |
size 5752
|