ahmadmwali committed on
Commit
ceddb6b
·
verified ·
1 Parent(s): 2ed6a83

End of training

Browse files
README.md CHANGED
@@ -20,12 +20,12 @@ should probably proofread and complete it, then remove this comment. -->
20
 
21
  This model is a fine-tuned version of [facebook/m2m100_418M](https://huggingface.co/facebook/m2m100_418M) on the None dataset.
22
  It achieves the following results on the evaluation set:
23
- - Bleu: 0.8249
24
- - F1: 0.9232
25
- - Wer: 0.0832
26
- - Cer: 0.0268
27
  - Meteor: 0.9148
28
- - Loss: 6.1040
29
 
30
  ## Model description
31
 
@@ -57,9 +57,9 @@ The following hyperparameters were used during training:
57
 
58
  | Training Loss | Epoch | Step | Bleu | F1 | Wer | Cer | Meteor | Validation Loss |
59
  |:-------------:|:-----:|:-----:|:------:|:------:|:------:|:------:|:------:|:---------------:|
60
- | 6.1256 | 1.0 | 12500 | 0.7995 | 0.9118 | 0.0952 | 0.0304 | 0.9020 | 6.1150 |
61
- | 6.1178 | 2.0 | 25000 | 0.8172 | 0.9199 | 0.0870 | 0.0282 | 0.9109 | 6.1073 |
62
- | 6.1012 | 3.0 | 37500 | 0.8249 | 0.9232 | 0.0832 | 0.0268 | 0.9148 | 6.1040 |
63
 
64
 
65
  ### Framework versions
 
20
 
21
  This model is a fine-tuned version of [facebook/m2m100_418M](https://huggingface.co/facebook/m2m100_418M) on the None dataset.
22
  It achieves the following results on the evaluation set:
23
+ - Bleu: 0.8239
24
+ - F1: 0.9229
25
+ - Wer: 0.0824
26
+ - Cer: 0.0262
27
  - Meteor: 0.9148
28
+ - Loss: 6.1042
29
 
30
  ## Model description
31
 
 
57
 
58
  | Training Loss | Epoch | Step | Bleu | F1 | Wer | Cer | Meteor | Validation Loss |
59
  |:-------------:|:-----:|:-----:|:------:|:------:|:------:|:------:|:------:|:---------------:|
60
+ | 6.1256 | 1.0 | 12500 | 0.7992 | 0.9121 | 0.0950 | 0.0308 | 0.9022 | 6.1147 |
61
+ | 6.1187 | 2.0 | 25000 | 0.8172 | 0.9198 | 0.0868 | 0.0281 | 0.9112 | 6.1067 |
62
+ | 6.0999 | 3.0 | 37500 | 0.8239 | 0.9229 | 0.0824 | 0.0262 | 0.9148 | 6.1042 |
63
 
64
 
65
  ### Framework versions
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df925e911da24f615a4d68b215c318fa2965e08757af878cf2d246e3c44f46fc
3
  size 9457520
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:623178331108dd55759c25e0b0c82afe9518f980c8d9591c61f9af36582850cc
3
  size 9457520
all_results.json CHANGED
@@ -1,17 +1,17 @@
1
  {
2
  "epoch": 3.0,
3
- "eval_bleu": 0.824917705791878,
4
- "eval_cer": 0.02681490368523881,
5
- "eval_f1": 0.923196495238835,
6
- "eval_loss": 6.103950500488281,
7
- "eval_meteor": 0.9148204705294067,
8
- "eval_runtime": 588.9014,
9
- "eval_samples_per_second": 8.49,
10
- "eval_steps_per_second": 0.267,
11
- "eval_wer": 0.08322672667667196,
12
  "total_flos": 6.544636730199245e+17,
13
- "train_loss": 6.1357289762369795,
14
- "train_runtime": 6359.0647,
15
- "train_samples_per_second": 188.702,
16
- "train_steps_per_second": 5.897
17
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "eval_bleu": 0.823943051750742,
4
+ "eval_cer": 0.02620693733959594,
5
+ "eval_f1": 0.9229451426010926,
6
+ "eval_loss": 6.104158401489258,
7
+ "eval_meteor": 0.914842353945872,
8
+ "eval_runtime": 585.9186,
9
+ "eval_samples_per_second": 8.534,
10
+ "eval_steps_per_second": 0.268,
11
+ "eval_wer": 0.08241131435383867,
12
  "total_flos": 6.544636730199245e+17,
13
+ "train_loss": 6.135559250488281,
14
+ "train_runtime": 6379.9802,
15
+ "train_samples_per_second": 188.084,
16
+ "train_steps_per_second": 5.878
17
  }
eval_final_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 3.0,
3
- "eval_bleu": 0.824917705791878,
4
- "eval_cer": 0.02681490368523881,
5
- "eval_f1": 0.923196495238835,
6
- "eval_loss": 6.103950500488281,
7
- "eval_meteor": 0.9148204705294067,
8
- "eval_runtime": 588.9014,
9
- "eval_samples_per_second": 8.49,
10
- "eval_steps_per_second": 0.267,
11
- "eval_wer": 0.08322672667667196
12
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "eval_bleu": 0.823943051750742,
4
+ "eval_cer": 0.02620693733959594,
5
+ "eval_f1": 0.9229451426010926,
6
+ "eval_loss": 6.104158401489258,
7
+ "eval_meteor": 0.914842353945872,
8
+ "eval_runtime": 585.9186,
9
+ "eval_samples_per_second": 8.534,
10
+ "eval_steps_per_second": 0.268,
11
+ "eval_wer": 0.08241131435383867
12
  }
logs/events.out.tfevents.1748594726.c1279aa5eb8f.2392797.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dfdd73098d373d0a0a80419a87b84bd5fede6bdbe4d461c073d47b77297d5ab
3
+ size 169393
logs/events.out.tfevents.1748601691.c1279aa5eb8f.2392797.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73a5035d517561a4f79c0b6359c933fc48f844d074ceb09feb278c85c55a0ac5
3
+ size 607
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
  "total_flos": 6.544636730199245e+17,
4
- "train_loss": 6.1357289762369795,
5
- "train_runtime": 6359.0647,
6
- "train_samples_per_second": 188.702,
7
- "train_steps_per_second": 5.897
8
  }
 
1
  {
2
  "epoch": 3.0,
3
  "total_flos": 6.544636730199245e+17,
4
+ "train_loss": 6.135559250488281,
5
+ "train_runtime": 6379.9802,
6
+ "train_samples_per_second": 188.084,
7
+ "train_steps_per_second": 5.878
8
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c4657d63dc5ae7140d37135453e97b70890bf594b38d44b5f03bd7e75012e4c
3
  size 7864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36abf2cd69f7eda3a79614183ba40bf29c0001c076aae486529f711fd65d9ab9
3
  size 7864