File size: 378 Bytes
7f07139
e96b55c
 
7f07139
 
 
 
e96b55c
 
7f07139
1
2
3
4
5
6
7
8
9
10
11
{
  "tokenizer_class": "PreTrainedTokenizerFast",
  "model_max_length": 512,
  "bos_token": "<s>",
  "eos_token": "</s>",
  "unk_token": "<unk>",
  "pad_token": "<pad>",
  "clean_up_tokenization_spaces": false,
  "note": "This model uses a tiktoken-based tokenizer (cl100k_base remapped to 8192 tokens). The tokenizer.model file is included for reference, but loading it requires custom code."
}