when-the-dick-sooo-fire committed on
Commit
90896e7
·
verified ·
1 Parent(s): 07e0aa7

Upload tokenizer

Browse files
Files changed (2) hide show
  1. special_tokens_map.json +7 -0
  2. tokenizer_config.json +1 -0
special_tokens_map.json CHANGED
@@ -48,6 +48,13 @@
48
  "rstrip": false,
49
  "single_word": false
50
  },
 
 
 
 
 
 
 
51
  "unk_token": {
52
  "content": "<|endoftext|>",
53
  "lstrip": false,
 
48
  "rstrip": false,
49
  "single_word": false
50
  },
51
+ "pad_token": {
52
+ "content": "<|endoftext|>",
53
+ "lstrip": false,
54
+ "normalized": false,
55
+ "rstrip": false,
56
+ "single_word": false
57
+ },
58
  "unk_token": {
59
  "content": "<|endoftext|>",
60
  "lstrip": false,
tokenizer_config.json CHANGED
@@ -305,6 +305,7 @@
305
  "clean_up_tokenization_spaces": true,
306
  "eos_token": "<|endoftext|>",
307
  "model_max_length": 1000000000000000019884624838656,
 
308
  "tokenizer_class": "GPT2Tokenizer",
309
  "unk_token": "<|endoftext|>"
310
  }
 
305
  "clean_up_tokenization_spaces": true,
306
  "eos_token": "<|endoftext|>",
307
  "model_max_length": 1000000000000000019884624838656,
308
+ "pad_token": "<|endoftext|>",
309
  "tokenizer_class": "GPT2Tokenizer",
310
  "unk_token": "<|endoftext|>"
311
  }