mouseyy committed on
Commit
5f36875
·
verified ·
1 Parent(s): 1465c2f

Training in progress, step 500

Browse files
README.md CHANGED
@@ -1,20 +1,41 @@
1
  ---
2
  library_name: transformers
 
 
3
  tags:
4
  - generated_from_trainer
5
  datasets:
6
  - common_voice_17_0
 
 
7
  model-index:
8
- - name: best_model_copy
9
- results: []
 
 
 
 
 
 
 
 
 
 
 
 
 
10
  ---
11
 
12
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
13
  should probably proofread and complete it, then remove this comment. -->
14
 
15
- # best_model_copy
16
 
17
- This model was trained from scratch on the common_voice_17_0 dataset.
 
 
 
 
18
 
19
  ## Model description
20
 
@@ -33,7 +54,7 @@ More information needed
33
  ### Training hyperparameters
34
 
35
  The following hyperparameters were used during training:
36
- - learning_rate: 5e-05
37
  - train_batch_size: 16
38
  - eval_batch_size: 16
39
  - seed: 42
@@ -43,11 +64,21 @@ The following hyperparameters were used during training:
43
  - total_eval_batch_size: 32
44
  - optimizer: Use adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
45
  - lr_scheduler_type: linear
46
- - training_steps: 20
 
47
  - mixed_precision_training: Native AMP
48
 
49
  ### Training results
50
 
 
 
 
 
 
 
 
 
 
51
 
52
 
53
  ### Framework versions
 
1
  ---
2
  library_name: transformers
3
+ license: apache-2.0
4
+ base_model: facebook/wav2vec2-xls-r-300m
5
  tags:
6
  - generated_from_trainer
7
  datasets:
8
  - common_voice_17_0
9
+ metrics:
10
+ - wer
11
  model-index:
12
+ - name: result_data-1
13
+ results:
14
+ - task:
15
+ name: Automatic Speech Recognition
16
+ type: automatic-speech-recognition
17
+ dataset:
18
+ name: common_voice_17_0
19
+ type: common_voice_17_0
20
+ config: uk
21
+ split: test
22
+ args: uk
23
+ metrics:
24
+ - name: Wer
25
+ type: wer
26
+ value: 0.36512878573450325
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
30
  should probably proofread and complete it, then remove this comment. -->
31
 
32
+ # result_data-1
33
 
34
+ This model is a fine-tuned version of [facebook/wav2vec2-xls-r-300m](https://huggingface.co/facebook/wav2vec2-xls-r-300m) on the common_voice_17_0 dataset.
35
+ It achieves the following results on the evaluation set:
36
+ - Loss: 0.2220
37
+ - Wer: 0.3651
38
+ - Cer: 0.1691
39
 
40
  ## Model description
41
 
 
54
  ### Training hyperparameters
55
 
56
  The following hyperparameters were used during training:
57
+ - learning_rate: 6.532628754904162e-05
58
  - train_batch_size: 16
59
  - eval_batch_size: 16
60
  - seed: 42
 
64
  - total_eval_batch_size: 32
65
  - optimizer: Use adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
66
  - lr_scheduler_type: linear
67
+ - lr_scheduler_warmup_steps: 206
68
+ - num_epochs: 7.0
69
  - mixed_precision_training: Native AMP
70
 
71
  ### Training results
72
 
73
+ | Training Loss | Epoch | Step | Validation Loss | Wer | Cer |
74
+ |:-------------:|:------:|:----:|:---------------:|:------:|:------:|
75
+ | 0.6324 | 0.9099 | 1000 | 0.5004 | 0.6083 | 0.2381 |
76
+ | 0.3497 | 1.8198 | 2000 | 0.3087 | 0.4650 | 0.1965 |
77
+ | 0.2642 | 2.7298 | 3000 | 0.2636 | 0.4249 | 0.1841 |
78
+ | 0.2328 | 3.6397 | 4000 | 0.2431 | 0.3960 | 0.1789 |
79
+ | 0.1933 | 4.5496 | 5000 | 0.2289 | 0.3773 | 0.1732 |
80
+ | 0.1783 | 5.4595 | 6000 | 0.2300 | 0.3728 | 0.1711 |
81
+ | 0.1617 | 6.3694 | 7000 | 0.2233 | 0.3637 | 0.1700 |
82
 
83
 
84
  ### Framework versions
all_results.json CHANGED
@@ -8,9 +8,9 @@
8
  "eval_steps_per_second": 0.973,
9
  "eval_wer": 0.36512878573450325,
10
  "total_flos": 5.670215301911177e+19,
11
- "train_loss": 0.0,
12
- "train_runtime": 0.0021,
13
  "train_samples": 35144,
14
- "train_samples_per_second": 303179.869,
15
- "train_steps_per_second": 9474.371
16
  }
 
8
  "eval_steps_per_second": 0.973,
9
  "eval_wer": 0.36512878573450325,
10
  "total_flos": 5.670215301911177e+19,
11
+ "train_loss": 0.6279906528631082,
12
+ "train_runtime": 12613.1325,
13
  "train_samples": 35144,
14
+ "train_samples_per_second": 19.504,
15
+ "train_steps_per_second": 0.61
16
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:55e38c1ef5f98213097dc909a322bd8b032c79a0f6b4090e080891ef1c9450a3
3
  size 1261971480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65fd38bdd9eb5d3221f74bcb2b95aae5c0ba46c886054aad54fe7a1f3afacd54
3
  size 1261971480
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 7.0,
3
  "total_flos": 5.670215301911177e+19,
4
- "train_loss": 0.0,
5
- "train_runtime": 0.0021,
6
  "train_samples": 35144,
7
- "train_samples_per_second": 303179.869,
8
- "train_steps_per_second": 9474.371
9
  }
 
1
  {
2
  "epoch": 7.0,
3
  "total_flos": 5.670215301911177e+19,
4
+ "train_loss": 0.6279906528631082,
5
+ "train_runtime": 12613.1325,
6
  "train_samples": 35144,
7
+ "train_samples_per_second": 19.504,
8
+ "train_steps_per_second": 0.61
9
  }
trainer_state.json CHANGED
@@ -614,16 +614,16 @@
614
  "epoch": 7.0,
615
  "step": 7693,
616
  "total_flos": 5.670215301911177e+19,
617
- "train_loss": 0.0,
618
- "train_runtime": 0.0021,
619
- "train_samples_per_second": 303179.869,
620
- "train_steps_per_second": 9474.371
621
  }
622
  ],
623
  "logging_steps": 100,
624
- "max_steps": 20,
625
  "num_input_tokens_seen": 0,
626
- "num_train_epochs": 1,
627
  "save_steps": 1000,
628
  "stateful_callbacks": {
629
  "TrainerControl": {
 
614
  "epoch": 7.0,
615
  "step": 7693,
616
  "total_flos": 5.670215301911177e+19,
617
+ "train_loss": 0.6279906528631082,
618
+ "train_runtime": 12613.1325,
619
+ "train_samples_per_second": 19.504,
620
+ "train_steps_per_second": 0.61
621
  }
622
  ],
623
  "logging_steps": 100,
624
+ "max_steps": 7693,
625
  "num_input_tokens_seen": 0,
626
+ "num_train_epochs": 7,
627
  "save_steps": 1000,
628
  "stateful_callbacks": {
629
  "TrainerControl": {
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2dd9a3371207756c14b28a56bce31f16533d1bb9f10f83944d5afdbbdde100f9
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9c3b967339fedd24be512b8d851eeee9701f6ecbd2b3a0a29e3af25125287ba
3
  size 5368