Commit ·
f96514a
1
Parent(s): 76d7629
Training in progress, step 35500
Browse files
- {checkpoint-14200 → checkpoint-35500}/config.json +0 -0
- {checkpoint-14200 → checkpoint-35500}/optimizer.pt +1 -1
- {checkpoint-14200 → checkpoint-35500}/preprocessor_config.json +0 -0
- {checkpoint-14200 → checkpoint-35500}/pytorch_model.bin +1 -1
- {checkpoint-14200 → checkpoint-35500}/rng_state.pth +1 -1
- {checkpoint-14200 → checkpoint-35500}/scaler.pt +1 -1
- {checkpoint-14200 → checkpoint-35500}/scheduler.pt +1 -1
- {checkpoint-14200 → checkpoint-35500}/trainer_state.json +50 -5
- {checkpoint-14200 → checkpoint-35500}/training_args.bin +0 -0
- pytorch_model.bin +1 -1
- runs/Mar22_03-10-48_48c38934e4d2/events.out.tfevents.1774154952.48c38934e4d2.13068.0 +2 -2
{checkpoint-14200 → checkpoint-35500}/config.json
RENAMED
|
File without changes
|
{checkpoint-14200 → checkpoint-35500}/optimizer.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 721687499
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2852db7cf014b14489b48c2b4434ecfc606da92d93234e33d8ab765f212d43ac
|
| 3 |
size 721687499
|
{checkpoint-14200 → checkpoint-35500}/preprocessor_config.json
RENAMED
|
File without changes
|
{checkpoint-14200 → checkpoint-35500}/pytorch_model.bin
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 377674359
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7f6a91c0cd3efa0326503b4148695da414af93512af37092a4f75e483f5b7886
|
| 3 |
size 377674359
|
{checkpoint-14200 → checkpoint-35500}/rng_state.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14773
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c57cd849ea7c0f7c68a597c364a643221c2bec00262fd4d7f58e148e5f4e191b
|
| 3 |
size 14773
|
{checkpoint-14200 → checkpoint-35500}/scaler.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1383
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:16be25ec3156a8306d0d1d2d1e342085ac407c8f872a2b9638fdc2d2263d1aa3
|
| 3 |
size 1383
|
{checkpoint-14200 → checkpoint-35500}/scheduler.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1465
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e397eca0724de78a0bcb22ea0120cbc2c4e2e3481857c7f086bf94efbedf9e94
|
| 3 |
size 1465
|
{checkpoint-14200 → checkpoint-35500}/trainer_state.json
RENAMED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
{
|
| 2 |
-
"best_metric": 0.
|
| 3 |
-
"best_model_checkpoint": "JuanPajero/FT-S3/checkpoint-
|
| 4 |
-
"epoch":
|
| 5 |
-
"global_step":
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
@@ -36,11 +36,56 @@
|
|
| 36 |
"eval_steps_per_second": 2.061,
|
| 37 |
"eval_wer": 0.31068540368553627,
|
| 38 |
"step": 14200
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 39 |
}
|
| 40 |
],
|
| 41 |
"max_steps": 71900,
|
| 42 |
"num_train_epochs": 10,
|
| 43 |
-
"total_flos":
|
| 44 |
"trial_name": null,
|
| 45 |
"trial_params": null
|
| 46 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"best_metric": 0.6885841488838196,
|
| 3 |
+
"best_model_checkpoint": "JuanPajero/FT-S3/checkpoint-21300",
|
| 4 |
+
"epoch": 4.937413073713491,
|
| 5 |
+
"global_step": 35500,
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
|
|
| 36 |
"eval_steps_per_second": 2.061,
|
| 37 |
"eval_wer": 0.31068540368553627,
|
| 38 |
"step": 14200
|
| 39 |
+
},
|
| 40 |
+
{
|
| 41 |
+
"epoch": 2.96,
|
| 42 |
+
"learning_rate": 2.3462679647658787e-05,
|
| 43 |
+
"loss": 0.338,
|
| 44 |
+
"step": 21300
|
| 45 |
+
},
|
| 46 |
+
{
|
| 47 |
+
"epoch": 2.96,
|
| 48 |
+
"eval_loss": 0.6885841488838196,
|
| 49 |
+
"eval_runtime": 1207.7134,
|
| 50 |
+
"eval_samples_per_second": 16.501,
|
| 51 |
+
"eval_steps_per_second": 2.063,
|
| 52 |
+
"eval_wer": 0.2933106599088304,
|
| 53 |
+
"step": 21300
|
| 54 |
+
},
|
| 55 |
+
{
|
| 56 |
+
"epoch": 3.95,
|
| 57 |
+
"learning_rate": 2.0172461752433936e-05,
|
| 58 |
+
"loss": 0.3011,
|
| 59 |
+
"step": 28400
|
| 60 |
+
},
|
| 61 |
+
{
|
| 62 |
+
"epoch": 3.95,
|
| 63 |
+
"eval_loss": 0.7342329621315002,
|
| 64 |
+
"eval_runtime": 1203.3539,
|
| 65 |
+
"eval_samples_per_second": 16.56,
|
| 66 |
+
"eval_steps_per_second": 2.07,
|
| 67 |
+
"eval_wer": 0.28296994666476305,
|
| 68 |
+
"step": 28400
|
| 69 |
+
},
|
| 70 |
+
{
|
| 71 |
+
"epoch": 4.94,
|
| 72 |
+
"learning_rate": 1.688270746407047e-05,
|
| 73 |
+
"loss": 0.2763,
|
| 74 |
+
"step": 35500
|
| 75 |
+
},
|
| 76 |
+
{
|
| 77 |
+
"epoch": 4.94,
|
| 78 |
+
"eval_loss": 0.7109239101409912,
|
| 79 |
+
"eval_runtime": 1205.3003,
|
| 80 |
+
"eval_samples_per_second": 16.534,
|
| 81 |
+
"eval_steps_per_second": 2.067,
|
| 82 |
+
"eval_wer": 0.2757370562620463,
|
| 83 |
+
"step": 35500
|
| 84 |
}
|
| 85 |
],
|
| 86 |
"max_steps": 71900,
|
| 87 |
"num_train_epochs": 10,
|
| 88 |
+
"total_flos": 4.242114943584952e+19,
|
| 89 |
"trial_name": null,
|
| 90 |
"trial_params": null
|
| 91 |
}
|
{checkpoint-14200 → checkpoint-35500}/training_args.bin
RENAMED
|
File without changes
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 377674359
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7f6a91c0cd3efa0326503b4148695da414af93512af37092a4f75e483f5b7886
|
| 3 |
size 377674359
|
runs/Mar22_03-10-48_48c38934e4d2/events.out.tfevents.1774154952.48c38934e4d2.13068.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2ea1f4ca7c8ae4baa6f5c6635fafb4d811b283af4126a373e662e5eeb816106d
|
| 3 |
+
size 7460
|