TirkNork committed on
Commit
b1b2708
·
1 Parent(s): 74b3180

Training in progress, epoch 1

Browse files
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4312ba81161ac250d8f6941528881e2266502edd29bfc4e92d735daf063f4ee8
3
  size 711492725
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:690cb7d2283d2766378b1f90b255f2c3b1e5a26752a47fd62295325a36d7ad7c
3
  size 711492725
runs/May25_04-35-09_6085b8a868f4/events.out.tfevents.1684989311.6085b8a868f4.2893.4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:310986e60b3f1540b776d52c8f8e9efc58c3eb326cc25512a18f70f32154e7a3
3
- size 7220
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f150a9a62e7410bf926cda552e82a1d62e6cd628daf02bc3aeab543a42d2387
3
+ size 7897
runs/May25_04-44-49_6085b8a868f4/1684989892.2371247/events.out.tfevents.1684989892.6085b8a868f4.2893.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:137d1263f06602f3720e07a03e667220fc551a2f426b6959ee005ab7dccd208e
3
+ size 5949
runs/May25_04-44-49_6085b8a868f4/events.out.tfevents.1684989892.6085b8a868f4.2893.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14d244b765759e68fa70d2246ef5454ef6333f3725df467340ec7e022a777ef6
3
+ size 4648
special_tokens_map.json CHANGED
@@ -1,7 +1,20 @@
1
  {
2
- "cls_token": "[CLS]",
3
- "mask_token": "[MASK]",
4
- "pad_token": "[PAD]",
5
- "sep_token": "[SEP]",
6
- "unk_token": "[UNK]"
 
 
 
 
 
 
 
 
 
 
 
 
 
7
  }
 
1
  {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED",
5
+ "<_>"
6
+ ],
7
+ "bos_token": "<s>",
8
+ "cls_token": "<s>",
9
+ "eos_token": "</s>",
10
+ "mask_token": {
11
+ "content": "<mask>",
12
+ "lstrip": true,
13
+ "normalized": true,
14
+ "rstrip": false,
15
+ "single_word": false
16
+ },
17
+ "pad_token": "<pad>",
18
+ "sep_token": "</s>",
19
+ "unk_token": "<unk>"
20
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -1,13 +1,25 @@
1
  {
 
 
 
 
 
 
2
  "clean_up_tokenization_spaces": true,
3
- "cls_token": "[CLS]",
4
- "do_lower_case": false,
5
- "mask_token": "[MASK]",
6
- "model_max_length": 512,
7
- "pad_token": "[PAD]",
8
- "sep_token": "[SEP]",
9
- "strip_accents": null,
10
- "tokenize_chinese_chars": true,
11
- "tokenizer_class": "BertTokenizer",
12
- "unk_token": "[UNK]"
 
 
 
 
 
 
13
  }
 
1
  {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED",
5
+ "<_>"
6
+ ],
7
+ "bos_token": "<s>",
8
  "clean_up_tokenization_spaces": true,
9
+ "cls_token": "<s>",
10
+ "eos_token": "</s>",
11
+ "mask_token": {
12
+ "__type": "AddedToken",
13
+ "content": "<mask>",
14
+ "lstrip": true,
15
+ "normalized": true,
16
+ "rstrip": false,
17
+ "single_word": false
18
+ },
19
+ "model_max_length": 1000000000000000019884624838656,
20
+ "pad_token": "<pad>",
21
+ "sep_token": "</s>",
22
+ "sp_model_kwargs": {},
23
+ "tokenizer_class": "CamembertTokenizer",
24
+ "unk_token": "<unk>"
25
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72cb64b2cdae175f6ed25a1e29581d70d31b58b33af98f43fe3e258d9e58ef70
3
  size 3963
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:354f345e0c0332e0e61c13122f29cace605feac58fa8631a983751f1e0dbb8af
3
  size 3963