aoiandroid committed on
Commit
c64b6bd
·
verified ·
1 Parent(s): 5e2e7cd

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. Helsinki-NLP-opus-mt-NORTH_EU-NORTH_EU/README.md +26 -0
  2. Helsinki-NLP-opus-mt-NORTH_EU-NORTH_EU/config.json +55 -0
  3. Helsinki-NLP-opus-mt-NORTH_EU-NORTH_EU/generation_config.json +16 -0
  4. Helsinki-NLP-opus-mt-NORTH_EU-NORTH_EU/special_tokens_map.json +5 -0
  5. Helsinki-NLP-opus-mt-NORTH_EU-NORTH_EU/tokenizer.json +0 -0
  6. Helsinki-NLP-opus-mt-NORTH_EU-NORTH_EU/tokenizer_config.json +39 -0
  7. Helsinki-NLP-opus-mt-NORTH_EU-NORTH_EU/vocab.json +0 -0
  8. Helsinki-NLP-opus-mt-ROMANCE-en/README.md +25 -0
  9. Helsinki-NLP-opus-mt-ROMANCE-en/config.json +55 -0
  10. Helsinki-NLP-opus-mt-ROMANCE-en/generation_config.json +16 -0
  11. Helsinki-NLP-opus-mt-ROMANCE-en/special_tokens_map.json +5 -0
  12. Helsinki-NLP-opus-mt-ROMANCE-en/tokenizer.json +0 -0
  13. Helsinki-NLP-opus-mt-ROMANCE-en/tokenizer_config.json +39 -0
  14. Helsinki-NLP-opus-mt-ROMANCE-en/vocab.json +0 -0
  15. Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/README.md +26 -0
  16. Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/config.json +55 -0
  17. Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/decoder_model_merged.onnx +3 -0
  18. Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/encoder_model.onnx +3 -0
  19. Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/generation_config.json +16 -0
  20. Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/special_tokens_map.json +5 -0
  21. Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/tokenizer.json +0 -0
  22. Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/tokenizer_config.json +39 -0
  23. Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/vocab.json +0 -0
  24. Helsinki-NLP-opus-mt-aav-en/decoder_model.onnx +3 -0
  25. Helsinki-NLP-opus-mt-aav-en/decoder_model_merged.onnx +3 -0
  26. Helsinki-NLP-opus-mt-aav-en/decoder_with_past_model.onnx +3 -0
  27. Helsinki-NLP-opus-mt-aav-en/encoder_model.onnx +3 -0
  28. Helsinki-NLP-opus-mt-aav-en/source.spm +3 -0
  29. Helsinki-NLP-opus-mt-aav-en/target.spm +3 -0
  30. Helsinki-NLP-opus-mt-aed-es/decoder_model.onnx +3 -0
  31. Helsinki-NLP-opus-mt-aed-es/decoder_model_merged.onnx +3 -0
  32. Helsinki-NLP-opus-mt-aed-es/decoder_with_past_model.onnx +3 -0
  33. Helsinki-NLP-opus-mt-aed-es/encoder_model.onnx +3 -0
  34. Helsinki-NLP-opus-mt-aed-es/source.spm +3 -0
  35. Helsinki-NLP-opus-mt-aed-es/target.spm +3 -0
  36. Helsinki-NLP-opus-mt-af-de/decoder_model.onnx +3 -0
  37. Helsinki-NLP-opus-mt-af-de/decoder_model_merged.onnx +3 -0
  38. Helsinki-NLP-opus-mt-af-de/decoder_with_past_model.onnx +3 -0
  39. Helsinki-NLP-opus-mt-af-de/encoder_model.onnx +3 -0
  40. Helsinki-NLP-opus-mt-af-de/source.spm +3 -0
  41. Helsinki-NLP-opus-mt-af-de/target.spm +3 -0
  42. Helsinki-NLP-opus-mt-af-en/decoder_model.onnx +3 -0
  43. Helsinki-NLP-opus-mt-af-en/decoder_model_merged.onnx +3 -0
  44. Helsinki-NLP-opus-mt-af-en/decoder_with_past_model.onnx +3 -0
  45. Helsinki-NLP-opus-mt-af-en/encoder_model.onnx +3 -0
  46. Helsinki-NLP-opus-mt-af-en/source.spm +3 -0
  47. Helsinki-NLP-opus-mt-af-en/target.spm +3 -0
  48. Helsinki-NLP-opus-mt-af-eo/decoder_model.onnx +3 -0
  49. Helsinki-NLP-opus-mt-af-eo/decoder_model_merged.onnx +3 -0
  50. Helsinki-NLP-opus-mt-af-eo/decoder_with_past_model.onnx +3 -0
Helsinki-NLP-opus-mt-NORTH_EU-NORTH_EU/README.md ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - translation
4
+ license: apache-2.0
5
+ ---
6
+
7
+ ### opus-mt-NORTH_EU-NORTH_EU
8
+
9
+ * source languages: de,nl,fy,af,da,fo,is,no,nb,nn,sv
10
+ * target languages: de,nl,fy,af,da,fo,is,no,nb,nn,sv
11
+ * OPUS readme: [de+nl+fy+af+da+fo+is+no+nb+nn+sv-de+nl+fy+af+da+fo+is+no+nb+nn+sv](https://github.com/Helsinki-NLP/OPUS-MT-train/blob/master/models/de+nl+fy+af+da+fo+is+no+nb+nn+sv-de+nl+fy+af+da+fo+is+no+nb+nn+sv/README.md)
12
+
13
+ * dataset: opus
14
+ * model: transformer-align
15
+ * pre-processing: normalization + SentencePiece
16
+ * a sentence initial language token is required in the form of `>>id<<` (id = valid target language ID)
17
+ * download original weights: [opus-2020-01-15.zip](https://object.pouta.csc.fi/OPUS-MT-models/de+nl+fy+af+da+fo+is+no+nb+nn+sv-de+nl+fy+af+da+fo+is+no+nb+nn+sv/opus-2020-01-15.zip)
18
+ * test set translations: [opus-2020-01-15.test.txt](https://object.pouta.csc.fi/OPUS-MT-models/de+nl+fy+af+da+fo+is+no+nb+nn+sv-de+nl+fy+af+da+fo+is+no+nb+nn+sv/opus-2020-01-15.test.txt)
19
+ * test set scores: [opus-2020-01-15.eval.txt](https://object.pouta.csc.fi/OPUS-MT-models/de+nl+fy+af+da+fo+is+no+nb+nn+sv-de+nl+fy+af+da+fo+is+no+nb+nn+sv/opus-2020-01-15.eval.txt)
20
+
21
+ ## Benchmarks
22
+
23
+ | testset | BLEU | chr-F |
24
+ |-----------------------|-------|-------|
25
+ | Tatoeba.de.sv | 48.1 | 0.663 |
26
+
Helsinki-NLP-opus-mt-NORTH_EU-NORTH_EU/config.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_dropout": 0.0,
3
+ "activation_function": "swish",
4
+ "add_bias_logits": false,
5
+ "add_final_layer_norm": false,
6
+ "architectures": [
7
+ "MarianMTModel"
8
+ ],
9
+ "attention_dropout": 0.0,
10
+ "bos_token_id": 0,
11
+ "classif_dropout": 0.0,
12
+ "classifier_dropout": 0.0,
13
+ "d_model": 512,
14
+ "decoder_attention_heads": 8,
15
+ "decoder_ffn_dim": 2048,
16
+ "decoder_layerdrop": 0.0,
17
+ "decoder_layers": 6,
18
+ "decoder_start_token_id": 58011,
19
+ "decoder_vocab_size": 58012,
20
+ "dropout": 0.1,
21
+ "encoder_attention_heads": 8,
22
+ "encoder_ffn_dim": 2048,
23
+ "encoder_layerdrop": 0.0,
24
+ "encoder_layers": 6,
25
+ "eos_token_id": 0,
26
+ "forced_eos_token_id": 0,
27
+ "id2label": {
28
+ "0": "LABEL_0",
29
+ "1": "LABEL_1",
30
+ "2": "LABEL_2"
31
+ },
32
+ "init_std": 0.02,
33
+ "is_encoder_decoder": true,
34
+ "is_transformers_support_available": true,
35
+ "label2id": {
36
+ "LABEL_0": 0,
37
+ "LABEL_1": 1,
38
+ "LABEL_2": 2
39
+ },
40
+ "max_length": null,
41
+ "max_position_embeddings": 512,
42
+ "model_type": "marian",
43
+ "normalize_before": false,
44
+ "normalize_embedding": false,
45
+ "num_beams": null,
46
+ "num_hidden_layers": 6,
47
+ "pad_token_id": 58011,
48
+ "scale_embedding": true,
49
+ "share_encoder_decoder_embeddings": true,
50
+ "static_position_embeddings": true,
51
+ "torch_dtype": "float32",
52
+ "transformers_version": "4.53.3",
53
+ "use_cache": true,
54
+ "vocab_size": 58012
55
+ }
Helsinki-NLP-opus-mt-NORTH_EU-NORTH_EU/generation_config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bad_words_ids": [
3
+ [
4
+ 58011
5
+ ]
6
+ ],
7
+ "bos_token_id": 0,
8
+ "decoder_start_token_id": 58011,
9
+ "eos_token_id": 0,
10
+ "forced_eos_token_id": 0,
11
+ "max_length": 512,
12
+ "num_beams": 4,
13
+ "pad_token_id": 58011,
14
+ "renormalize_logits": true,
15
+ "transformers_version": "4.53.3"
16
+ }
Helsinki-NLP-opus-mt-NORTH_EU-NORTH_EU/special_tokens_map.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "eos_token": "</s>",
3
+ "pad_token": "<pad>",
4
+ "unk_token": "<unk>"
5
+ }
Helsinki-NLP-opus-mt-NORTH_EU-NORTH_EU/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
Helsinki-NLP-opus-mt-NORTH_EU-NORTH_EU/tokenizer_config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "</s>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "<unk>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "58011": {
20
+ "content": "<pad>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ }
27
+ },
28
+ "clean_up_tokenization_spaces": false,
29
+ "eos_token": "</s>",
30
+ "extra_special_tokens": {},
31
+ "model_max_length": 512,
32
+ "pad_token": "<pad>",
33
+ "separate_vocabs": false,
34
+ "source_lang": "de+nl+fy+af+da+fo+is+no+nb+nn+sv",
35
+ "sp_model_kwargs": {},
36
+ "target_lang": "de+nl+fy+af+da+fo+is+no+nb+nn+sv",
37
+ "tokenizer_class": "MarianTokenizer",
38
+ "unk_token": "<unk>"
39
+ }
Helsinki-NLP-opus-mt-NORTH_EU-NORTH_EU/vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
Helsinki-NLP-opus-mt-ROMANCE-en/README.md ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - translation
4
+ license: apache-2.0
5
+ ---
6
+
7
+ ### opus-mt-ROMANCE-en
8
+
9
+ * source languages: fr,fr_BE,fr_CA,fr_FR,wa,frp,oc,ca,rm,lld,fur,lij,lmo,es,es_AR,es_CL,es_CO,es_CR,es_DO,es_EC,es_ES,es_GT,es_HN,es_MX,es_NI,es_PA,es_PE,es_PR,es_SV,es_UY,es_VE,pt,pt_br,pt_BR,pt_PT,gl,lad,an,mwl,it,it_IT,co,nap,scn,vec,sc,ro,la
10
+ * target languages: en
11
+ * OPUS readme: [fr+fr_BE+fr_CA+fr_FR+wa+frp+oc+ca+rm+lld+fur+lij+lmo+es+es_AR+es_CL+es_CO+es_CR+es_DO+es_EC+es_ES+es_GT+es_HN+es_MX+es_NI+es_PA+es_PE+es_PR+es_SV+es_UY+es_VE+pt+pt_br+pt_BR+pt_PT+gl+lad+an+mwl+it+it_IT+co+nap+scn+vec+sc+ro+la-en](https://github.com/Helsinki-NLP/OPUS-MT-train/blob/master/models/fr+fr_BE+fr_CA+fr_FR+wa+frp+oc+ca+rm+lld+fur+lij+lmo+es+es_AR+es_CL+es_CO+es_CR+es_DO+es_EC+es_ES+es_GT+es_HN+es_MX+es_NI+es_PA+es_PE+es_PR+es_SV+es_UY+es_VE+pt+pt_br+pt_BR+pt_PT+gl+lad+an+mwl+it+it_IT+co+nap+scn+vec+sc+ro+la-en/README.md)
12
+
13
+ * dataset: opus
14
+ * model: transformer
15
+ * pre-processing: normalization + SentencePiece
16
+ * download original weights: [opus-2020-04-01.zip](https://object.pouta.csc.fi/OPUS-MT-models/fr+fr_BE+fr_CA+fr_FR+wa+frp+oc+ca+rm+lld+fur+lij+lmo+es+es_AR+es_CL+es_CO+es_CR+es_DO+es_EC+es_ES+es_GT+es_HN+es_MX+es_NI+es_PA+es_PE+es_PR+es_SV+es_UY+es_VE+pt+pt_br+pt_BR+pt_PT+gl+lad+an+mwl+it+it_IT+co+nap+scn+vec+sc+ro+la-en/opus-2020-04-01.zip)
17
+ * test set translations: [opus-2020-04-01.test.txt](https://object.pouta.csc.fi/OPUS-MT-models/fr+fr_BE+fr_CA+fr_FR+wa+frp+oc+ca+rm+lld+fur+lij+lmo+es+es_AR+es_CL+es_CO+es_CR+es_DO+es_EC+es_ES+es_GT+es_HN+es_MX+es_NI+es_PA+es_PE+es_PR+es_SV+es_UY+es_VE+pt+pt_br+pt_BR+pt_PT+gl+lad+an+mwl+it+it_IT+co+nap+scn+vec+sc+ro+la-en/opus-2020-04-01.test.txt)
18
+ * test set scores: [opus-2020-04-01.eval.txt](https://object.pouta.csc.fi/OPUS-MT-models/fr+fr_BE+fr_CA+fr_FR+wa+frp+oc+ca+rm+lld+fur+lij+lmo+es+es_AR+es_CL+es_CO+es_CR+es_DO+es_EC+es_ES+es_GT+es_HN+es_MX+es_NI+es_PA+es_PE+es_PR+es_SV+es_UY+es_VE+pt+pt_br+pt_BR+pt_PT+gl+lad+an+mwl+it+it_IT+co+nap+scn+vec+sc+ro+la-en/opus-2020-04-01.eval.txt)
19
+
20
+ ## Benchmarks
21
+
22
+ | testset | BLEU | chr-F |
23
+ |-----------------------|-------|-------|
24
+ | Tatoeba.fr.en | 62.2 | 0.750 |
25
+
Helsinki-NLP-opus-mt-ROMANCE-en/config.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_dropout": 0.0,
3
+ "activation_function": "swish",
4
+ "add_bias_logits": false,
5
+ "add_final_layer_norm": false,
6
+ "architectures": [
7
+ "MarianMTModel"
8
+ ],
9
+ "attention_dropout": 0.0,
10
+ "bos_token_id": 0,
11
+ "classif_dropout": 0.0,
12
+ "classifier_dropout": 0.0,
13
+ "d_model": 512,
14
+ "decoder_attention_heads": 8,
15
+ "decoder_ffn_dim": 2048,
16
+ "decoder_layerdrop": 0.0,
17
+ "decoder_layers": 6,
18
+ "decoder_start_token_id": 65000,
19
+ "decoder_vocab_size": 65001,
20
+ "dropout": 0.1,
21
+ "encoder_attention_heads": 8,
22
+ "encoder_ffn_dim": 2048,
23
+ "encoder_layerdrop": 0.0,
24
+ "encoder_layers": 6,
25
+ "eos_token_id": 0,
26
+ "forced_eos_token_id": 0,
27
+ "id2label": {
28
+ "0": "LABEL_0",
29
+ "1": "LABEL_1",
30
+ "2": "LABEL_2"
31
+ },
32
+ "init_std": 0.02,
33
+ "is_encoder_decoder": true,
34
+ "is_transformers_support_available": true,
35
+ "label2id": {
36
+ "LABEL_0": 0,
37
+ "LABEL_1": 1,
38
+ "LABEL_2": 2
39
+ },
40
+ "max_length": null,
41
+ "max_position_embeddings": 512,
42
+ "model_type": "marian",
43
+ "normalize_before": false,
44
+ "normalize_embedding": false,
45
+ "num_beams": null,
46
+ "num_hidden_layers": 6,
47
+ "pad_token_id": 65000,
48
+ "scale_embedding": true,
49
+ "share_encoder_decoder_embeddings": true,
50
+ "static_position_embeddings": true,
51
+ "torch_dtype": "float32",
52
+ "transformers_version": "4.53.3",
53
+ "use_cache": true,
54
+ "vocab_size": 65001
55
+ }
Helsinki-NLP-opus-mt-ROMANCE-en/generation_config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bad_words_ids": [
3
+ [
4
+ 65000
5
+ ]
6
+ ],
7
+ "bos_token_id": 0,
8
+ "decoder_start_token_id": 65000,
9
+ "eos_token_id": 0,
10
+ "forced_eos_token_id": 0,
11
+ "max_length": 512,
12
+ "num_beams": 4,
13
+ "pad_token_id": 65000,
14
+ "renormalize_logits": true,
15
+ "transformers_version": "4.53.3"
16
+ }
Helsinki-NLP-opus-mt-ROMANCE-en/special_tokens_map.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "eos_token": "</s>",
3
+ "pad_token": "<pad>",
4
+ "unk_token": "<unk>"
5
+ }
Helsinki-NLP-opus-mt-ROMANCE-en/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
Helsinki-NLP-opus-mt-ROMANCE-en/tokenizer_config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "</s>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "<unk>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "65000": {
20
+ "content": "<pad>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ }
27
+ },
28
+ "clean_up_tokenization_spaces": false,
29
+ "eos_token": "</s>",
30
+ "extra_special_tokens": {},
31
+ "model_max_length": 512,
32
+ "pad_token": "<pad>",
33
+ "separate_vocabs": false,
34
+ "source_lang": "fr+fr_BE+fr_CA+fr_FR+wa+frp+oc+ca+rm+lld+fur+lij+lmo+es+es_AR+es_CL+es_CO+es_CR+es_DO+es_EC+es_ES+es_GT+es_HN+es_MX+es_NI+es_PA+es_PE+es_PR+es_SV+es_UY+es_VE+pt+pt_br+pt_BR+pt_PT+gl+lad+an+mwl+it+it_IT+co+nap+scn+vec+sc+ro+la",
35
+ "sp_model_kwargs": {},
36
+ "target_lang": "en",
37
+ "tokenizer_class": "MarianTokenizer",
38
+ "unk_token": "<unk>"
39
+ }
Helsinki-NLP-opus-mt-ROMANCE-en/vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/README.md ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - translation
4
+ license: apache-2.0
5
+ ---
6
+
7
+ ### opus-mt-SCANDINAVIA-SCANDINAVIA
8
+
9
+ * source languages: da,fo,is,no,nb,nn,sv
10
+ * target languages: da,fo,is,no,nb,nn,sv
11
+ * OPUS readme: [da+fo+is+no+nb+nn+sv-da+fo+is+no+nb+nn+sv](https://github.com/Helsinki-NLP/OPUS-MT-train/blob/master/models/da+fo+is+no+nb+nn+sv-da+fo+is+no+nb+nn+sv/README.md)
12
+
13
+ * dataset: opus
14
+ * model: transformer-align
15
+ * pre-processing: normalization + SentencePiece
16
+ * a sentence initial language token is required in the form of `>>id<<` (id = valid target language ID)
17
+ * download original weights: [opus-2019-12-18.zip](https://object.pouta.csc.fi/OPUS-MT-models/da+fo+is+no+nb+nn+sv-da+fo+is+no+nb+nn+sv/opus-2019-12-18.zip)
18
+ * test set translations: [opus-2019-12-18.test.txt](https://object.pouta.csc.fi/OPUS-MT-models/da+fo+is+no+nb+nn+sv-da+fo+is+no+nb+nn+sv/opus-2019-12-18.test.txt)
19
+ * test set scores: [opus-2019-12-18.eval.txt](https://object.pouta.csc.fi/OPUS-MT-models/da+fo+is+no+nb+nn+sv-da+fo+is+no+nb+nn+sv/opus-2019-12-18.eval.txt)
20
+
21
+ ## Benchmarks
22
+
23
+ | testset | BLEU | chr-F |
24
+ |-----------------------|-------|-------|
25
+ | Tatoeba.da.sv | 69.2 | 0.811 |
26
+
Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/config.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_dropout": 0.0,
3
+ "activation_function": "swish",
4
+ "add_bias_logits": false,
5
+ "add_final_layer_norm": false,
6
+ "architectures": [
7
+ "MarianMTModel"
8
+ ],
9
+ "attention_dropout": 0.0,
10
+ "bos_token_id": 0,
11
+ "classif_dropout": 0.0,
12
+ "classifier_dropout": 0.0,
13
+ "d_model": 512,
14
+ "decoder_attention_heads": 8,
15
+ "decoder_ffn_dim": 2048,
16
+ "decoder_layerdrop": 0.0,
17
+ "decoder_layers": 6,
18
+ "decoder_start_token_id": 47230,
19
+ "decoder_vocab_size": 47231,
20
+ "dropout": 0.1,
21
+ "encoder_attention_heads": 8,
22
+ "encoder_ffn_dim": 2048,
23
+ "encoder_layerdrop": 0.0,
24
+ "encoder_layers": 6,
25
+ "eos_token_id": 0,
26
+ "forced_eos_token_id": 0,
27
+ "id2label": {
28
+ "0": "LABEL_0",
29
+ "1": "LABEL_1",
30
+ "2": "LABEL_2"
31
+ },
32
+ "init_std": 0.02,
33
+ "is_encoder_decoder": true,
34
+ "is_transformers_support_available": true,
35
+ "label2id": {
36
+ "LABEL_0": 0,
37
+ "LABEL_1": 1,
38
+ "LABEL_2": 2
39
+ },
40
+ "max_length": null,
41
+ "max_position_embeddings": 512,
42
+ "model_type": "marian",
43
+ "normalize_before": false,
44
+ "normalize_embedding": false,
45
+ "num_beams": null,
46
+ "num_hidden_layers": 6,
47
+ "pad_token_id": 47230,
48
+ "scale_embedding": true,
49
+ "share_encoder_decoder_embeddings": true,
50
+ "static_position_embeddings": true,
51
+ "torch_dtype": "float32",
52
+ "transformers_version": "4.53.3",
53
+ "use_cache": true,
54
+ "vocab_size": 47231
55
+ }
Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/decoder_model_merged.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7f3c6e8efcf5f93188982655c8ef9c4f3fc29cd21dec1906c34a4291888a066
3
+ size 199245826
Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/encoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95539dc9a9f33a0e5e3e14ea86ac00724d50eec28e9f0c2e8ff32acf2d6d7efd
3
+ size 173509237
Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/generation_config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bad_words_ids": [
3
+ [
4
+ 47230
5
+ ]
6
+ ],
7
+ "bos_token_id": 0,
8
+ "decoder_start_token_id": 47230,
9
+ "eos_token_id": 0,
10
+ "forced_eos_token_id": 0,
11
+ "max_length": 512,
12
+ "num_beams": 4,
13
+ "pad_token_id": 47230,
14
+ "renormalize_logits": true,
15
+ "transformers_version": "4.53.3"
16
+ }
Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/special_tokens_map.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "eos_token": "</s>",
3
+ "pad_token": "<pad>",
4
+ "unk_token": "<unk>"
5
+ }
Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/tokenizer_config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "</s>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "<unk>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "47230": {
20
+ "content": "<pad>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ }
27
+ },
28
+ "clean_up_tokenization_spaces": false,
29
+ "eos_token": "</s>",
30
+ "extra_special_tokens": {},
31
+ "model_max_length": 512,
32
+ "pad_token": "<pad>",
33
+ "separate_vocabs": false,
34
+ "source_lang": "da+fo+is+no+nb+nn+sv",
35
+ "sp_model_kwargs": {},
36
+ "target_lang": "da+fo+is+no+nb+nn+sv",
37
+ "tokenizer_class": "MarianTokenizer",
38
+ "unk_token": "<unk>"
39
+ }
Helsinki-NLP-opus-mt-SCANDINAVIA-SCANDINAVIA/vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
Helsinki-NLP-opus-mt-aav-en/decoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb921385ed704138739069c343b12529f0a1f16d271c9650d9105318041b2b7b
3
+ size 217138528
Helsinki-NLP-opus-mt-aav-en/decoder_model_merged.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cee791b01f3c4e64b513a6fa308d48d344bed126c83c8e00a176b28d92b6e2d
3
+ size 217319842
Helsinki-NLP-opus-mt-aav-en/decoder_with_past_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0930e9a38a0cc0654fa0a32d32d2f9e1451bde1681f6bdaea27b62d1e482f282
3
+ size 204508897
Helsinki-NLP-opus-mt-aav-en/encoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4863f9397f896583c5a1a5425f1d7c2e3fbc2ea64ff08188442e36ba7fe0aa68
3
+ size 191548021
Helsinki-NLP-opus-mt-aav-en/source.spm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8c4d9428511d3a9d74229e91896dafa2c471ccb2dbf4a979ae8e103c046350c
3
+ size 903675
Helsinki-NLP-opus-mt-aav-en/target.spm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b1342bd6e880f28bc7f0aa92a4bceff9d503411e54721cf3538a6a48d5c9ae9
3
+ size 808788
Helsinki-NLP-opus-mt-aed-es/decoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6fdc3d946bb538c5e7303152c442d8e7572294623e63df6f93d8b9e745ed4dc
3
+ size 150625000
Helsinki-NLP-opus-mt-aed-es/decoder_model_merged.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70bd857a8a86da9798f312c9dd783f43c3ec094bacba1fda05705ba07e3f3d8f
3
+ size 150806314
Helsinki-NLP-opus-mt-aed-es/decoder_with_past_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b366f6d41a4da30076e7dd187fd6bb70561b1637fd3d0dc66883702618a058d0
3
+ size 137995369
Helsinki-NLP-opus-mt-aed-es/encoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69ce40ab172649c1a190a02d0d339b84f0a9d818e727b702a7979c96f7597368
3
+ size 125164149
Helsinki-NLP-opus-mt-aed-es/source.spm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a469ba7fd19386b913383b924581ebd61b38761fe611e473e6f4f664d89a807
3
+ size 686452
Helsinki-NLP-opus-mt-aed-es/target.spm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02567ed5f02824725d8b9a36109eea3b016ecb6fc8ef6807f8100733b4d9eb29
3
+ size 687915
Helsinki-NLP-opus-mt-af-de/decoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b42a87996428ecda85317b367cc3348f6ddff54533a6f1f234b0315b8a8a51c9
3
+ size 222715864
Helsinki-NLP-opus-mt-af-de/decoder_model_merged.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25142d2387ebb50e456fdb16beda5cfa1da99e332b57e5076cae7b542bd8d77a
3
+ size 222897178
Helsinki-NLP-opus-mt-af-de/decoder_with_past_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4498eae1deced04e3b43173660cd17f78d7432a2905ede3ca6eed4518d05d678
3
+ size 210086233
Helsinki-NLP-opus-mt-af-de/encoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4640f60375f32cf58d862511aa360d160cb60faf31bfd4a4f805ccca04dfe71a
3
+ size 197114485
Helsinki-NLP-opus-mt-af-de/source.spm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56083744a21429cbc330f88631f5011dcc7fa9cbb40d10d482430afb97f8fb3a
3
+ size 829665
Helsinki-NLP-opus-mt-af-de/target.spm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5015ee4ea5d0f6a85472f116268d7a4f75d27e47350f0769b11e7bd982110e31
3
+ size 848688
Helsinki-NLP-opus-mt-af-en/decoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:671def97b4e4c389ce54209dd8adad04d2b3cdfecbe81c7aafd657e4242336d0
3
+ size 220023640
Helsinki-NLP-opus-mt-af-en/decoder_model_merged.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a24360eabd8810b852325f12a63f1af165a969b4e5a3a29f27ac790fb3a2ca92
3
+ size 220204954
Helsinki-NLP-opus-mt-af-en/decoder_with_past_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3517989bf5c54a319ec40666856aa3df212c61cc30e35d7255303c2401a7653b
3
+ size 207394009
Helsinki-NLP-opus-mt-af-en/encoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69bafd07a2ced3dc762ee8bd719a53f24651829deffa5eacb5703a520fc1629d
3
+ size 194427509
Helsinki-NLP-opus-mt-af-en/source.spm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c0775610306d171b4f98a32f28024d0b24927d42c305fdb72d03c551908280d
3
+ size 826387
Helsinki-NLP-opus-mt-af-en/target.spm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c32b593efa15f5e22d81934adb3a44fbfa0b6bfc112a2a62ffb1b3c4c164ef33
3
+ size 819272
Helsinki-NLP-opus-mt-af-eo/decoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:373e3f0612a461555991ccdc70d5ccbad048fab753bdde0e180d4dfe0fb75f4a
3
+ size 117485197
Helsinki-NLP-opus-mt-af-eo/decoder_model_merged.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19b154d6f71f5e930f8946613f24e1366bcfae2beb41c18c94c16286e7f20dbd
3
+ size 117666509
Helsinki-NLP-opus-mt-af-eo/decoder_with_past_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f196c1ffb35b4547662efa7d1855ce4c050bfabbd90bd88292c3fe17c770c9b
3
+ size 104855566