Model save
Browse files
- README.md +33 -33
- config.json +4 -4
- model.safetensors +1 -1
- training_args.bin +1 -1
README.md
CHANGED
|
@@ -17,8 +17,8 @@ should probably proofread and complete it, then remove this comment. -->
|
|
| 17 |
|
| 18 |
This model is a fine-tuned version of [facebook/wav2vec2-base-960h](https://huggingface.co/facebook/wav2vec2-base-960h) on an unknown dataset.
|
| 19 |
It achieves the following results on the evaluation set:
|
| 20 |
-
- Loss:
|
| 21 |
-
- Wer: 0.
|
| 22 |
|
| 23 |
## Model description
|
| 24 |
|
|
@@ -37,7 +37,7 @@ More information needed
|
|
| 37 |
### Training hyperparameters
|
| 38 |
|
| 39 |
The following hyperparameters were used during training:
|
| 40 |
-
- learning_rate:
|
| 41 |
- train_batch_size: 32
|
| 42 |
- eval_batch_size: 32
|
| 43 |
- seed: 42
|
|
@@ -50,36 +50,36 @@ The following hyperparameters were used during training:
|
|
| 50 |
|
| 51 |
| Training Loss | Epoch | Step | Validation Loss | Wer |
|
| 52 |
|:-------------:|:-----:|:----:|:---------------:|:------:|
|
| 53 |
-
|
|
| 54 |
-
|
|
| 55 |
-
|
|
| 56 |
-
|
|
| 57 |
-
|
|
| 58 |
-
|
|
| 59 |
-
|
|
| 60 |
-
|
|
| 61 |
-
|
|
| 62 |
-
|
|
| 63 |
-
|
|
| 64 |
-
|
|
| 65 |
-
|
|
| 66 |
-
|
|
| 67 |
-
|
|
| 68 |
-
|
|
| 69 |
-
|
|
| 70 |
-
|
|
| 71 |
-
|
|
| 72 |
-
|
|
| 73 |
-
|
|
| 74 |
-
|
|
| 75 |
-
|
|
| 76 |
-
|
|
| 77 |
-
|
|
| 78 |
-
|
|
| 79 |
-
|
|
| 80 |
-
|
|
| 81 |
-
|
|
| 82 |
-
|
|
| 83 |
|
| 84 |
|
| 85 |
### Framework versions
|
|
|
|
| 17 |
|
| 18 |
This model is a fine-tuned version of [facebook/wav2vec2-base-960h](https://huggingface.co/facebook/wav2vec2-base-960h) on an unknown dataset.
|
| 19 |
It achieves the following results on the evaluation set:
|
| 20 |
+
- Loss: 135.5781
|
| 21 |
+
- Wer: 0.0427
|
| 22 |
|
| 23 |
## Model description
|
| 24 |
|
|
|
|
| 37 |
### Training hyperparameters
|
| 38 |
|
| 39 |
The following hyperparameters were used during training:
|
| 40 |
+
- learning_rate: 8e-05
|
| 41 |
- train_batch_size: 32
|
| 42 |
- eval_batch_size: 32
|
| 43 |
- seed: 42
|
|
|
|
| 50 |
|
| 51 |
| Training Loss | Epoch | Step | Validation Loss | Wer |
|
| 52 |
|:-------------:|:-----:|:----:|:---------------:|:------:|
|
| 53 |
+
| 1518.9794 | 1.0 | 168 | 1000.8097 | 0.4552 |
|
| 54 |
+
| 1028.341 | 2.0 | 336 | 779.6321 | 0.3719 |
|
| 55 |
+
| 820.663 | 3.0 | 504 | 659.3882 | 0.2988 |
|
| 56 |
+
| 718.5459 | 4.0 | 672 | 516.9663 | 0.2303 |
|
| 57 |
+
| 606.0076 | 5.0 | 840 | 421.7630 | 0.1998 |
|
| 58 |
+
| 535.3864 | 6.0 | 1008 | 478.5203 | 0.2051 |
|
| 59 |
+
| 466.5894 | 7.0 | 1176 | 440.6602 | 0.1739 |
|
| 60 |
+
| 432.4227 | 8.0 | 1344 | 294.9408 | 0.1323 |
|
| 61 |
+
| 373.2972 | 9.0 | 1512 | 261.7947 | 0.1122 |
|
| 62 |
+
| 355.762 | 10.0 | 1680 | 315.7706 | 0.1300 |
|
| 63 |
+
| 314.1884 | 11.0 | 1848 | 350.8355 | 0.1181 |
|
| 64 |
+
| 288.5761 | 12.0 | 2016 | 310.4185 | 0.1201 |
|
| 65 |
+
| 291.121 | 13.0 | 2184 | 255.1681 | 0.0876 |
|
| 66 |
+
| 236.6435 | 14.0 | 2352 | 240.4549 | 0.0873 |
|
| 67 |
+
| 219.9664 | 15.0 | 2520 | 237.7248 | 0.0922 |
|
| 68 |
+
| 201.4798 | 16.0 | 2688 | 162.6640 | 0.0619 |
|
| 69 |
+
| 199.2839 | 17.0 | 2856 | 232.3585 | 0.0800 |
|
| 70 |
+
| 194.1537 | 18.0 | 3024 | 215.3707 | 0.0772 |
|
| 71 |
+
| 177.814 | 19.0 | 3192 | 171.7732 | 0.0589 |
|
| 72 |
+
| 166.7409 | 20.0 | 3360 | 166.2487 | 0.0597 |
|
| 73 |
+
| 169.7996 | 21.0 | 3528 | 135.5038 | 0.0546 |
|
| 74 |
+
| 153.8049 | 22.0 | 3696 | 150.6883 | 0.0518 |
|
| 75 |
+
| 143.4673 | 23.0 | 3864 | 179.0132 | 0.0541 |
|
| 76 |
+
| 147.514 | 24.0 | 4032 | 131.5579 | 0.0419 |
|
| 77 |
+
| 138.0108 | 25.0 | 4200 | 154.8247 | 0.0493 |
|
| 78 |
+
| 142.9634 | 26.0 | 4368 | 165.7421 | 0.0586 |
|
| 79 |
+
| 123.1378 | 27.0 | 4536 | 160.7584 | 0.0472 |
|
| 80 |
+
| 129.9836 | 28.0 | 4704 | 104.9703 | 0.0366 |
|
| 81 |
+
| 113.1207 | 29.0 | 4872 | 172.9598 | 0.0490 |
|
| 82 |
+
| 110.3937 | 30.0 | 5040 | 135.5781 | 0.0427 |
|
| 83 |
|
| 84 |
|
| 85 |
### Framework versions
|
config.json
CHANGED
|
@@ -9,7 +9,7 @@
|
|
| 9 |
"architectures": [
|
| 10 |
"Wav2Vec2ForCTC"
|
| 11 |
],
|
| 12 |
-
"attention_dropout": 0.
|
| 13 |
"bos_token_id": 1,
|
| 14 |
"classifier_proj_size": 256,
|
| 15 |
"codevector_dim": 256,
|
|
@@ -50,12 +50,12 @@
|
|
| 50 |
"feat_extract_activation": "gelu",
|
| 51 |
"feat_extract_dropout": 0.0,
|
| 52 |
"feat_extract_norm": "group",
|
| 53 |
-
"feat_proj_dropout": 0.
|
| 54 |
"feat_quantizer_dropout": 0.0,
|
| 55 |
-
"final_dropout": 0.
|
| 56 |
"gradient_checkpointing": false,
|
| 57 |
"hidden_act": "gelu",
|
| 58 |
-
"hidden_dropout": 0.
|
| 59 |
"hidden_dropout_prob": 0.1,
|
| 60 |
"hidden_size": 768,
|
| 61 |
"initializer_range": 0.02,
|
|
|
|
| 9 |
"architectures": [
|
| 10 |
"Wav2Vec2ForCTC"
|
| 11 |
],
|
| 12 |
+
"attention_dropout": 0.15,
|
| 13 |
"bos_token_id": 1,
|
| 14 |
"classifier_proj_size": 256,
|
| 15 |
"codevector_dim": 256,
|
|
|
|
| 50 |
"feat_extract_activation": "gelu",
|
| 51 |
"feat_extract_dropout": 0.0,
|
| 52 |
"feat_extract_norm": "group",
|
| 53 |
+
"feat_proj_dropout": 0.15,
|
| 54 |
"feat_quantizer_dropout": 0.0,
|
| 55 |
+
"final_dropout": 0.15,
|
| 56 |
"gradient_checkpointing": false,
|
| 57 |
"hidden_act": "gelu",
|
| 58 |
+
"hidden_dropout": 0.15,
|
| 59 |
"hidden_dropout_prob": 0.1,
|
| 60 |
"hidden_size": 768,
|
| 61 |
"initializer_range": 0.02,
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 377611120
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b8fe0a83b85190e9c5df256386b63f109df3c6d5bc2d19218bec38e8582c02ab
|
| 3 |
size 377611120
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6cb190c3f93a398db49cf968b1143a0a2d6ea9ba39aea61f61608d6d31dfaa5a
|
| 3 |
size 5176
|