Coco-18 committed on
Commit
4fb829c
·
verified ·
1 Parent(s): 966ea14

Upload 9 files

Browse files
config.json CHANGED
@@ -13,7 +13,7 @@
13
  "decoder_layerdrop": 0.0,
14
  "decoder_layers": 6,
15
  "decoder_start_token_id": 57575,
16
- "decoder_vocab_size": 57578,
17
  "dropout": 0.1,
18
  "encoder_attention_heads": 16,
19
  "encoder_ffn_dim": 4096,
@@ -34,7 +34,7 @@
34
  "share_encoder_decoder_embeddings": true,
35
  "static_position_embeddings": true,
36
  "torch_dtype": "float32",
37
- "transformers_version": "4.50.2",
38
  "use_cache": true,
39
- "vocab_size": 57578
40
  }
 
13
  "decoder_layerdrop": 0.0,
14
  "decoder_layers": 6,
15
  "decoder_start_token_id": 57575,
16
+ "decoder_vocab_size": 57576,
17
  "dropout": 0.1,
18
  "encoder_attention_heads": 16,
19
  "encoder_ffn_dim": 4096,
 
34
  "share_encoder_decoder_embeddings": true,
35
  "static_position_embeddings": true,
36
  "torch_dtype": "float32",
37
+ "transformers_version": "4.51.0",
38
  "use_cache": true,
39
+ "vocab_size": 57576
40
  }
generation_config.json CHANGED
@@ -6,10 +6,15 @@
6
  ],
7
  "bos_token_id": 0,
8
  "decoder_start_token_id": 57575,
 
 
9
  "eos_token_id": 1006,
10
  "forced_eos_token_id": 1006,
11
  "max_length": 512,
 
12
  "num_beams": 4,
13
  "pad_token_id": 57575,
14
- "transformers_version": "4.50.2"
 
 
15
  }
 
6
  ],
7
  "bos_token_id": 0,
8
  "decoder_start_token_id": 57575,
9
+ "do_sample": true,
10
+ "early_stopping": true,
11
  "eos_token_id": 1006,
12
  "forced_eos_token_id": 1006,
13
  "max_length": 512,
14
+ "no_repeat_ngram_size": 2,
15
  "num_beams": 4,
16
  "pad_token_id": 57575,
17
+ "repetition_penalty": 1.5,
18
+ "top_p": 0.95,
19
+ "transformers_version": "4.51.0"
20
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8d59c11a4b535fa4aced97917c71655e58797001d9d3e5f59cba184932e2a24
3
- size 941528920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20dbceaa1e298897c2bee1815cf974f29dc6adf0abbd7838a743e447dc2c4c80
3
+ size 941520720
special_tokens_map.json CHANGED
@@ -1,20 +1,4 @@
1
  {
2
- "additional_special_tokens": [
3
- {
4
- "content": ">>pam<<",
5
- "lstrip": false,
6
- "normalized": false,
7
- "rstrip": false,
8
- "single_word": false
9
- },
10
- {
11
- "content": ">>eng<<",
12
- "lstrip": false,
13
- "normalized": false,
14
- "rstrip": false,
15
- "single_word": false
16
- }
17
- ],
18
  "eos_token": "</s>",
19
  "pad_token": "<pad>",
20
  "unk_token": "<unk>"
 
1
  {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  "eos_token": "</s>",
3
  "pad_token": "<pad>",
4
  "unk_token": "<unk>"
tokenizer_config.json CHANGED
@@ -1,59 +1,13 @@
1
  {
2
- "added_tokens_decoder": {
3
- "1006": {
4
- "content": "</s>",
5
- "lstrip": false,
6
- "normalized": false,
7
- "rstrip": false,
8
- "single_word": false,
9
- "special": true
10
- },
11
- "1264": {
12
- "content": "<unk>",
13
- "lstrip": false,
14
- "normalized": false,
15
- "rstrip": false,
16
- "single_word": false,
17
- "special": true
18
- },
19
- "57575": {
20
- "content": "<pad>",
21
- "lstrip": false,
22
- "normalized": false,
23
- "rstrip": false,
24
- "single_word": false,
25
- "special": true
26
- },
27
- "57576": {
28
- "content": ">>pam<<",
29
- "lstrip": false,
30
- "normalized": false,
31
- "rstrip": false,
32
- "single_word": false,
33
- "special": true
34
- },
35
- "57577": {
36
- "content": ">>eng<<",
37
- "lstrip": false,
38
- "normalized": false,
39
- "rstrip": false,
40
- "single_word": false,
41
- "special": true
42
- }
43
- },
44
- "additional_special_tokens": [
45
- ">>pam<<",
46
- ">>eng<<"
47
- ],
48
- "clean_up_tokenization_spaces": false,
49
  "eos_token": "</s>",
50
- "extra_special_tokens": {},
51
- "model_max_length": 512,
52
  "pad_token": "<pad>",
53
- "separate_vocabs": false,
54
- "source_lang": "phi",
55
  "sp_model_kwargs": {},
56
- "target_lang": "en",
57
- "tokenizer_class": "MarianTokenizer",
58
- "unk_token": "<unk>"
59
- }
 
 
1
  {
2
+ "source_lang": "phi",
3
+ "target_lang": "en",
4
+ "unk_token": "<unk>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "eos_token": "</s>",
 
 
6
  "pad_token": "<pad>",
7
+ "model_max_length": 512,
 
8
  "sp_model_kwargs": {},
9
+ "separate_vocabs": false,
10
+ "special_tokens_map_file": null,
11
+ "name_or_path": "./improved-model-pam-en/best-model-27.35",
12
+ "tokenizer_class": "MarianTokenizer"
13
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6dbc0544b6a625fab1adef53246a9f7bfb597b9f4356b5001910de6b596f6fbc
3
  size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae046995af2fab85c42eb485bd155c913cd14585cc6e5845ca7fe7e45d23b59b
3
  size 5496