End of training
Browse files- all_results.json +6 -6
- eval_results.json +3 -3
- runs/Aug06_15-17-30_dsai-server/events.out.tfevents.1691327490.dsai-server +3 -0
- train_results.json +3 -3
- trainer_state.json +18 -18
all_results.json
CHANGED
|
@@ -1,12 +1,12 @@
|
|
| 1 |
{
|
| 2 |
"epoch": 2.42,
|
| 3 |
"eval_loss": 0.4997063875198364,
|
| 4 |
-
"eval_runtime":
|
| 5 |
-
"eval_samples_per_second":
|
| 6 |
-
"eval_steps_per_second":
|
| 7 |
"eval_wer": 32.55118472509777,
|
| 8 |
"train_loss": 0.557375843334198,
|
| 9 |
-
"train_runtime":
|
| 10 |
-
"train_samples_per_second":
|
| 11 |
-
"train_steps_per_second":
|
| 12 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"epoch": 2.42,
|
| 3 |
"eval_loss": 0.4997063875198364,
|
| 4 |
+
"eval_runtime": 1863.5809,
|
| 5 |
+
"eval_samples_per_second": 1.944,
|
| 6 |
+
"eval_steps_per_second": 0.972,
|
| 7 |
"eval_wer": 32.55118472509777,
|
| 8 |
"train_loss": 0.557375843334198,
|
| 9 |
+
"train_runtime": 15732.1346,
|
| 10 |
+
"train_samples_per_second": 1.271,
|
| 11 |
+
"train_steps_per_second": 0.318
|
| 12 |
}
|
eval_results.json
CHANGED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
{
|
| 2 |
"epoch": 2.42,
|
| 3 |
"eval_loss": 0.4997063875198364,
|
| 4 |
-
"eval_runtime":
|
| 5 |
-
"eval_samples_per_second":
|
| 6 |
-
"eval_steps_per_second":
|
| 7 |
"eval_wer": 32.55118472509777
|
| 8 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"epoch": 2.42,
|
| 3 |
"eval_loss": 0.4997063875198364,
|
| 4 |
+
"eval_runtime": 1863.5809,
|
| 5 |
+
"eval_samples_per_second": 1.944,
|
| 6 |
+
"eval_steps_per_second": 0.972,
|
| 7 |
"eval_wer": 32.55118472509777
|
| 8 |
}
|
runs/Aug06_15-17-30_dsai-server/events.out.tfevents.1691327490.dsai-server
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5aa5e50dd77bf7ea5c0b55f72aef37b60e071b7908e122f5ad6463de79711c46
|
| 3 |
+
size 40
|
train_results.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
{
|
| 2 |
"epoch": 2.42,
|
| 3 |
"train_loss": 0.557375843334198,
|
| 4 |
-
"train_runtime":
|
| 5 |
-
"train_samples_per_second":
|
| 6 |
-
"train_steps_per_second":
|
| 7 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"epoch": 2.42,
|
| 3 |
"train_loss": 0.557375843334198,
|
| 4 |
+
"train_runtime": 15732.1346,
|
| 5 |
+
"train_samples_per_second": 1.271,
|
| 6 |
+
"train_steps_per_second": 0.318
|
| 7 |
}
|
trainer_state.json
CHANGED
|
@@ -250,9 +250,9 @@
|
|
| 250 |
{
|
| 251 |
"epoch": 0.48,
|
| 252 |
"eval_loss": 0.6328660845756531,
|
| 253 |
-
"eval_runtime":
|
| 254 |
-
"eval_samples_per_second":
|
| 255 |
-
"eval_steps_per_second":
|
| 256 |
"eval_wer": 42.10720036806993,
|
| 257 |
"step": 1000
|
| 258 |
},
|
|
@@ -499,9 +499,9 @@
|
|
| 499 |
{
|
| 500 |
"epoch": 0.97,
|
| 501 |
"eval_loss": 0.5514832139015198,
|
| 502 |
-
"eval_runtime":
|
| 503 |
-
"eval_samples_per_second":
|
| 504 |
-
"eval_steps_per_second":
|
| 505 |
"eval_wer": 35.86381412468369,
|
| 506 |
"step": 2000
|
| 507 |
},
|
|
@@ -748,9 +748,9 @@
|
|
| 748 |
{
|
| 749 |
"epoch": 1.45,
|
| 750 |
"eval_loss": 0.5231785178184509,
|
| 751 |
-
"eval_runtime":
|
| 752 |
-
"eval_samples_per_second":
|
| 753 |
-
"eval_steps_per_second":
|
| 754 |
"eval_wer": 34.018863584080975,
|
| 755 |
"step": 3000
|
| 756 |
},
|
|
@@ -997,9 +997,9 @@
|
|
| 997 |
{
|
| 998 |
"epoch": 1.94,
|
| 999 |
"eval_loss": 0.49930620193481445,
|
| 1000 |
-
"eval_runtime":
|
| 1001 |
-
"eval_samples_per_second":
|
| 1002 |
-
"eval_steps_per_second":
|
| 1003 |
"eval_wer": 32.67080745341615,
|
| 1004 |
"step": 4000
|
| 1005 |
},
|
|
@@ -1246,9 +1246,9 @@
|
|
| 1246 |
{
|
| 1247 |
"epoch": 2.42,
|
| 1248 |
"eval_loss": 0.4997063875198364,
|
| 1249 |
-
"eval_runtime":
|
| 1250 |
-
"eval_samples_per_second":
|
| 1251 |
-
"eval_steps_per_second":
|
| 1252 |
"eval_wer": 32.55118472509777,
|
| 1253 |
"step": 5000
|
| 1254 |
},
|
|
@@ -1257,9 +1257,9 @@
|
|
| 1257 |
"step": 5000,
|
| 1258 |
"total_flos": 4.9222998908928e+17,
|
| 1259 |
"train_loss": 0.557375843334198,
|
| 1260 |
-
"train_runtime":
|
| 1261 |
-
"train_samples_per_second":
|
| 1262 |
-
"train_steps_per_second":
|
| 1263 |
}
|
| 1264 |
],
|
| 1265 |
"max_steps": 5000,
|
|
|
|
| 250 |
{
|
| 251 |
"epoch": 0.48,
|
| 252 |
"eval_loss": 0.6328660845756531,
|
| 253 |
+
"eval_runtime": 2032.5756,
|
| 254 |
+
"eval_samples_per_second": 1.782,
|
| 255 |
+
"eval_steps_per_second": 0.891,
|
| 256 |
"eval_wer": 42.10720036806993,
|
| 257 |
"step": 1000
|
| 258 |
},
|
|
|
|
| 499 |
{
|
| 500 |
"epoch": 0.97,
|
| 501 |
"eval_loss": 0.5514832139015198,
|
| 502 |
+
"eval_runtime": 1912.9967,
|
| 503 |
+
"eval_samples_per_second": 1.893,
|
| 504 |
+
"eval_steps_per_second": 0.947,
|
| 505 |
"eval_wer": 35.86381412468369,
|
| 506 |
"step": 2000
|
| 507 |
},
|
|
|
|
| 748 |
{
|
| 749 |
"epoch": 1.45,
|
| 750 |
"eval_loss": 0.5231785178184509,
|
| 751 |
+
"eval_runtime": 1911.8055,
|
| 752 |
+
"eval_samples_per_second": 1.895,
|
| 753 |
+
"eval_steps_per_second": 0.947,
|
| 754 |
"eval_wer": 34.018863584080975,
|
| 755 |
"step": 3000
|
| 756 |
},
|
|
|
|
| 997 |
{
|
| 998 |
"epoch": 1.94,
|
| 999 |
"eval_loss": 0.49930620193481445,
|
| 1000 |
+
"eval_runtime": 1866.5046,
|
| 1001 |
+
"eval_samples_per_second": 1.941,
|
| 1002 |
+
"eval_steps_per_second": 0.97,
|
| 1003 |
"eval_wer": 32.67080745341615,
|
| 1004 |
"step": 4000
|
| 1005 |
},
|
|
|
|
| 1246 |
{
|
| 1247 |
"epoch": 2.42,
|
| 1248 |
"eval_loss": 0.4997063875198364,
|
| 1249 |
+
"eval_runtime": 1867.4461,
|
| 1250 |
+
"eval_samples_per_second": 1.94,
|
| 1251 |
+
"eval_steps_per_second": 0.97,
|
| 1252 |
"eval_wer": 32.55118472509777,
|
| 1253 |
"step": 5000
|
| 1254 |
},
|
|
|
|
| 1257 |
"step": 5000,
|
| 1258 |
"total_flos": 4.9222998908928e+17,
|
| 1259 |
"train_loss": 0.557375843334198,
|
| 1260 |
+
"train_runtime": 15732.1346,
|
| 1261 |
+
"train_samples_per_second": 1.271,
|
| 1262 |
+
"train_steps_per_second": 0.318
|
| 1263 |
}
|
| 1264 |
],
|
| 1265 |
"max_steps": 5000,
|