Must Erhang committed on
Commit
e81d975
·
1 Parent(s): bc5afce

drop token

Browse files
Files changed (2) hide show
  1. tokenizer.json +0 -0
  2. tokenizer_config.json +0 -9
tokenizer.json DELETED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json DELETED
@@ -1,9 +0,0 @@
1
- {
2
- "add_prefix_space": false,
3
- "bos_token": "<|endoftext|>",
4
- "clean_up_tokenization_spaces": true,
5
- "eos_token": "<|endoftext|>",
6
- "model_max_length": 1024,
7
- "tokenizer_class": "GPT2Tokenizer",
8
- "unk_token": "<|endoftext|>"
9
- }