jprivera44 committed on
Commit
36088de
·
verified ·
1 Parent(s): 32bcd8a

Upload checkpoint-4500/tokenizer_config.json with huggingface_hub

Browse files
checkpoint-4500/tokenizer_config.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "backend": "tokenizers",
3
+ "bos_token": "<|begin_of_text|>",
4
+ "clean_up_tokenization_spaces": true,
5
+ "eos_token": "<|eot_id|>",
6
+ "from_slow": true,
7
+ "is_local": false,
8
+ "legacy": false,
9
+ "model_input_names": [
10
+ "input_ids",
11
+ "attention_mask"
12
+ ],
13
+ "model_max_length": 131072,
14
+ "pad_token": "<|finetune_right_pad_id|>",
15
+ "padding_side": "right",
16
+ "tokenizer_class": "TokenizersBackend",
17
+ "unk_token": null
18
+ }