Commit ·
5f95b96
1
Parent(s): 90f5ea7
Training in progress, step 2000
Browse files- {checkpoint-500 → checkpoint-2000}/config.json +0 -0
- {checkpoint-500 → checkpoint-2000}/optimizer.pt +1 -1
- {checkpoint-500 → checkpoint-2000}/preprocessor_config.json +0 -0
- {checkpoint-500 → checkpoint-2000}/pytorch_model.bin +1 -1
- {checkpoint-500 → checkpoint-2000}/rng_state.pth +1 -1
- {checkpoint-500 → checkpoint-2000}/scaler.pt +1 -1
- {checkpoint-500 → checkpoint-2000}/scheduler.pt +1 -1
- {checkpoint-500 → checkpoint-2000}/trainer_state.json +50 -5
- {checkpoint-500 → checkpoint-2000}/training_args.bin +0 -0
- pytorch_model.bin +1 -1
- runs/Mar29_09-49-04_9cd49a3ed4d1/events.out.tfevents.1774778031.9cd49a3ed4d1.24900.0 +2 -2
{checkpoint-500 → checkpoint-2000}/config.json
RENAMED
|
File without changes
|
{checkpoint-500 → checkpoint-2000}/optimizer.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 721687499
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:64d22661dcba3d0cb6d911b4bd416db42117c6811d3cf45df55a7e83a9134508
|
| 3 |
size 721687499
|
{checkpoint-500 → checkpoint-2000}/preprocessor_config.json
RENAMED
|
File without changes
|
{checkpoint-500 → checkpoint-2000}/pytorch_model.bin
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 377674359
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a292bb26d6fc95282e7803a4a5b79608fdb1b8c7e82347ddc648c085b668783f
|
| 3 |
size 377674359
|
{checkpoint-500 → checkpoint-2000}/rng_state.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14709
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:98686e7580d7add044a34553ef0317cad35ddac85e33e65313c14e5e9b3231ea
|
| 3 |
size 14709
|
{checkpoint-500 → checkpoint-2000}/scaler.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1383
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:50786c05f475ef653b53ebc3a6daee74f887308e526f335b68aa5669a6ae4442
|
| 3 |
size 1383
|
{checkpoint-500 → checkpoint-2000}/scheduler.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1465
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d1c7208a78c4eead1aea111474a41ee9bbf256971f80fae940dad9bf17894d12
|
| 3 |
size 1465
|
{checkpoint-500 → checkpoint-2000}/trainer_state.json
RENAMED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
{
|
| 2 |
-
"best_metric":
|
| 3 |
-
"best_model_checkpoint": "JuanPajero/FT-XS2/checkpoint-
|
| 4 |
-
"epoch":
|
| 5 |
-
"global_step":
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
@@ -21,11 +21,56 @@
|
|
| 21 |
"eval_steps_per_second": 1.726,
|
| 22 |
"eval_wer": 0.9992262457443516,
|
| 23 |
"step": 500
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 24 |
}
|
| 25 |
],
|
| 26 |
"max_steps": 2940,
|
| 27 |
"num_train_epochs": 10,
|
| 28 |
-
"total_flos":
|
| 29 |
"trial_name": null,
|
| 30 |
"trial_params": null
|
| 31 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"best_metric": 1.0205419063568115,
|
| 3 |
+
"best_model_checkpoint": "JuanPajero/FT-XS2/checkpoint-1500",
|
| 4 |
+
"epoch": 6.802721088435375,
|
| 5 |
+
"global_step": 2000,
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
|
|
| 21 |
"eval_steps_per_second": 1.726,
|
| 22 |
"eval_wer": 0.9992262457443516,
|
| 23 |
"step": 500
|
| 24 |
+
},
|
| 25 |
+
{
|
| 26 |
+
"epoch": 3.4,
|
| 27 |
+
"learning_rate": 2.2029478458049888e-05,
|
| 28 |
+
"loss": 1.3402,
|
| 29 |
+
"step": 1000
|
| 30 |
+
},
|
| 31 |
+
{
|
| 32 |
+
"epoch": 3.4,
|
| 33 |
+
"eval_loss": 1.416143536567688,
|
| 34 |
+
"eval_runtime": 407.671,
|
| 35 |
+
"eval_samples_per_second": 14.019,
|
| 36 |
+
"eval_steps_per_second": 1.754,
|
| 37 |
+
"eval_wer": 0.6038765088207985,
|
| 38 |
+
"step": 1000
|
| 39 |
+
},
|
| 40 |
+
{
|
| 41 |
+
"epoch": 5.1,
|
| 42 |
+
"learning_rate": 1.6360544217687075e-05,
|
| 43 |
+
"loss": 0.7515,
|
| 44 |
+
"step": 1500
|
| 45 |
+
},
|
| 46 |
+
{
|
| 47 |
+
"epoch": 5.1,
|
| 48 |
+
"eval_loss": 1.0205419063568115,
|
| 49 |
+
"eval_runtime": 410.6786,
|
| 50 |
+
"eval_samples_per_second": 13.916,
|
| 51 |
+
"eval_steps_per_second": 1.741,
|
| 52 |
+
"eval_wer": 0.4986459300526153,
|
| 53 |
+
"step": 1500
|
| 54 |
+
},
|
| 55 |
+
{
|
| 56 |
+
"epoch": 6.8,
|
| 57 |
+
"learning_rate": 1.0691609977324262e-05,
|
| 58 |
+
"loss": 0.6136,
|
| 59 |
+
"step": 2000
|
| 60 |
+
},
|
| 61 |
+
{
|
| 62 |
+
"epoch": 6.8,
|
| 63 |
+
"eval_loss": 1.0564398765563965,
|
| 64 |
+
"eval_runtime": 410.9183,
|
| 65 |
+
"eval_samples_per_second": 13.908,
|
| 66 |
+
"eval_steps_per_second": 1.74,
|
| 67 |
+
"eval_wer": 0.4804704425874342,
|
| 68 |
+
"step": 2000
|
| 69 |
}
|
| 70 |
],
|
| 71 |
"max_steps": 2940,
|
| 72 |
"num_train_epochs": 10,
|
| 73 |
+
"total_flos": 2.357760234513715e+18,
|
| 74 |
"trial_name": null,
|
| 75 |
"trial_params": null
|
| 76 |
}
|
{checkpoint-500 → checkpoint-2000}/training_args.bin
RENAMED
|
File without changes
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 377674359
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a292bb26d6fc95282e7803a4a5b79608fdb1b8c7e82347ddc648c085b668783f
|
| 3 |
size 377674359
|
runs/Mar29_09-49-04_9cd49a3ed4d1/events.out.tfevents.1774778031.9cd49a3ed4d1.24900.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dab4dc11c82ddefba06bbd00f5a28f8cfa50916188b54c369f7a30257486fc3d
|
| 3 |
+
size 6959
|