sgd-llama-tokenizer / tokenizer_config.json
adibm's picture
Upload tokenizer
a50cd23
{
"add_prefix_space": false,
"additional_special_tokens": [
"<|begintarget|>",
"<|endtarget|>",
"<|begincontext|>",
"<|endcontext|>",
"<|system|>",
"<|user|>",
"<|beginlastuserutterance|>",
"<|endlastuserutterance|>",
"<|begindsts|>",
"<|enddsts|>",
"<|begindst|>",
"<|enddst|>",
"<|beginbelief|>",
"<|endbelief|>",
"<|beginresponse|>",
"<|endresponse|>",
"<|beginaction|>",
"<|endaction|>",
"<|beginuseraction|>",
"<|enduseraction|>",
"<|sysactions|>",
"<|beginintent|>",
"<|endintent|>",
"<|beginrequestedslots|>",
"<|endrequestedslots|>",
"<|promptdst|>",
"<|promptaction|>",
"<|promptresponse|>",
"<|pad|>",
"<|endoftext|>",
"<|startoftext|>",
"<|beginschema|>",
"<|endschema|>",
"<|schemaname|>",
"<|schemadescription|>",
"<|beginschemaintent|>",
"<|endschemaintent|>",
"<|intentrequiredslots|>",
"<|intentresultslots|>",
"<|intentoptionalslots|>",
"<|possiblevalues|>",
"<|endpossiblevalues|>",
"<|beginschemaslot|>",
"<|endschemaslot|>",
"<|schemaslotvalues|>",
"<|beginserviceresults|>",
"<|endserviceresults|>"
],
"bos_token": "<|startoftext|>",
"clean_up_tokenization_spaces": false,
"eos_token": "<|endtarget|>",
"model_max_length": 2048,
"pad_token": "<|pad|>",
"sp_model_kwargs": {},
"tokenizer_class": "LlamaTokenizer",
"unk_token": {
"__type": "AddedToken",
"content": "<unk>",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false
}
}