Model save
Browse files- all_results.json +4 -4
- eval_results.json +4 -4
- trainer_state.json +8 -0
all_results.json
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
{
|
| 2 |
"epoch": 6.6440677966101696,
|
| 3 |
-
"eval_loss": 2.
|
| 4 |
-
"eval_runtime": 16.
|
| 5 |
-
"eval_samples_per_second": 43.
|
| 6 |
-
"eval_steps_per_second": 5.
|
| 7 |
"total_flos": 5.749859310737818e+16,
|
| 8 |
"train_loss": 0.9609878695740992,
|
| 9 |
"train_runtime": 1272.9991,
|
|
|
|
| 1 |
{
|
| 2 |
"epoch": 6.6440677966101696,
|
| 3 |
+
"eval_loss": 2.681103229522705,
|
| 4 |
+
"eval_runtime": 16.2756,
|
| 5 |
+
"eval_samples_per_second": 43.501,
|
| 6 |
+
"eval_steps_per_second": 5.468,
|
| 7 |
"total_flos": 5.749859310737818e+16,
|
| 8 |
"train_loss": 0.9609878695740992,
|
| 9 |
"train_runtime": 1272.9991,
|
eval_results.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
{
|
| 2 |
"epoch": 6.6440677966101696,
|
| 3 |
-
"eval_loss": 2.
|
| 4 |
-
"eval_runtime": 16.
|
| 5 |
-
"eval_samples_per_second": 43.
|
| 6 |
-
"eval_steps_per_second": 5.
|
| 7 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"epoch": 6.6440677966101696,
|
| 3 |
+
"eval_loss": 2.681103229522705,
|
| 4 |
+
"eval_runtime": 16.2756,
|
| 5 |
+
"eval_samples_per_second": 43.501,
|
| 6 |
+
"eval_steps_per_second": 5.468
|
| 7 |
}
|
trainer_state.json
CHANGED
|
@@ -167,6 +167,14 @@
|
|
| 167 |
"eval_samples_per_second": 43.971,
|
| 168 |
"eval_steps_per_second": 5.527,
|
| 169 |
"step": 98
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 170 |
}
|
| 171 |
],
|
| 172 |
"logging_steps": 10,
|
|
|
|
| 167 |
"eval_samples_per_second": 43.971,
|
| 168 |
"eval_steps_per_second": 5.527,
|
| 169 |
"step": 98
|
| 170 |
+
},
|
| 171 |
+
{
|
| 172 |
+
"epoch": 6.6440677966101696,
|
| 173 |
+
"eval_loss": 2.6798176765441895,
|
| 174 |
+
"eval_runtime": 16.1818,
|
| 175 |
+
"eval_samples_per_second": 43.753,
|
| 176 |
+
"eval_steps_per_second": 5.5,
|
| 177 |
+
"step": 98
|
| 178 |
}
|
| 179 |
],
|
| 180 |
"logging_steps": 10,
|