MonicaMalvarez committed on
Commit
f812836
·
verified ·
1 Parent(s): 15996b7

Training in progress, step 500

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "facebook/mbart-large-50",
3
  "_num_labels": 3,
4
  "activation_dropout": 0.0,
5
  "activation_function": "gelu",
 
1
  {
2
+ "_name_or_path": "laureanadcastro/mbart-neutralization",
3
  "_num_labels": 3,
4
  "activation_dropout": 0.0,
5
  "activation_function": "gelu",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c577ea47e6185521c28aae60e566fde97a9391ac1505189022dc7b470ec76c40
3
  size 2444578688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:caeae2057f9a51c9f759b6607450b1fd1ebe4502321249c2e4222a23206813fd
3
  size 2444578688
special_tokens_map.json CHANGED
@@ -53,9 +53,27 @@
53
  "gl_ES",
54
  "sl_SI"
55
  ],
56
- "bos_token": "<s>",
57
- "cls_token": "<s>",
58
- "eos_token": "</s>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
59
  "mask_token": {
60
  "content": "<mask>",
61
  "lstrip": true,
@@ -63,7 +81,25 @@
63
  "rstrip": false,
64
  "single_word": false
65
  },
66
- "pad_token": "<pad>",
67
- "sep_token": "</s>",
68
- "unk_token": "<unk>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
69
  }
 
53
  "gl_ES",
54
  "sl_SI"
55
  ],
56
+ "bos_token": {
57
+ "content": "<s>",
58
+ "lstrip": false,
59
+ "normalized": false,
60
+ "rstrip": false,
61
+ "single_word": false
62
+ },
63
+ "cls_token": {
64
+ "content": "<s>",
65
+ "lstrip": false,
66
+ "normalized": false,
67
+ "rstrip": false,
68
+ "single_word": false
69
+ },
70
+ "eos_token": {
71
+ "content": "</s>",
72
+ "lstrip": false,
73
+ "normalized": false,
74
+ "rstrip": false,
75
+ "single_word": false
76
+ },
77
  "mask_token": {
78
  "content": "<mask>",
79
  "lstrip": true,
 
81
  "rstrip": false,
82
  "single_word": false
83
  },
84
+ "pad_token": {
85
+ "content": "<pad>",
86
+ "lstrip": false,
87
+ "normalized": false,
88
+ "rstrip": false,
89
+ "single_word": false
90
+ },
91
+ "sep_token": {
92
+ "content": "</s>",
93
+ "lstrip": false,
94
+ "normalized": false,
95
+ "rstrip": false,
96
+ "single_word": false
97
+ },
98
+ "unk_token": {
99
+ "content": "<unk>",
100
+ "lstrip": false,
101
+ "normalized": false,
102
+ "rstrip": false,
103
+ "single_word": false
104
+ }
105
  }
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ef126060ddcab67250020d3e4fff2150e3946ba9e7cea24b2a18dd969e0469da
3
- size 17110019
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e05149e476a633a1848f49e8aab40803980b7a22e1a0829229378759c819049
3
+ size 17094668
tokenizer_config.json CHANGED
@@ -512,17 +512,21 @@
512
  "sl_SI"
513
  ],
514
  "bos_token": "<s>",
515
- "clean_up_tokenization_spaces": false,
516
  "cls_token": "<s>",
517
  "eos_token": "</s>",
518
  "extra_special_tokens": {},
519
  "mask_token": "<mask>",
 
520
  "model_max_length": 1024,
521
  "pad_token": "<pad>",
522
  "sep_token": "</s>",
523
  "sp_model_kwargs": {},
524
  "src_lang": "en_XX",
 
525
  "tgt_lang": null,
526
  "tokenizer_class": "MBart50Tokenizer",
 
 
527
  "unk_token": "<unk>"
528
  }
 
512
  "sl_SI"
513
  ],
514
  "bos_token": "<s>",
515
+ "clean_up_tokenization_spaces": true,
516
  "cls_token": "<s>",
517
  "eos_token": "</s>",
518
  "extra_special_tokens": {},
519
  "mask_token": "<mask>",
520
+ "max_length": 128,
521
  "model_max_length": 1024,
522
  "pad_token": "<pad>",
523
  "sep_token": "</s>",
524
  "sp_model_kwargs": {},
525
  "src_lang": "en_XX",
526
+ "stride": 0,
527
  "tgt_lang": null,
528
  "tokenizer_class": "MBart50Tokenizer",
529
+ "truncation_side": "right",
530
+ "truncation_strategy": "longest_first",
531
  "unk_token": "<unk>"
532
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:445b4dc48f51c7bb725fcbd8223fad69c5d0a91ecb8c43cf0d56b652f2045751
3
- size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcb2c64f3ff64e7d89e570c05ca18e3f3bf4a4af13ecda7c829b6679ca56f3e8
3
+ size 5496