SatorTenet committed on
Commit
ae44094
·
verified ·
1 Parent(s): a0c8b11

v2: Add onboarding & redirect training (greeting, off-topic, free-text choices)

Browse files
Files changed (2) hide show
  1. model.safetensors +1 -1
  2. tokenizer_config.json +1 -1
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b25b89758093eaad174a71ec8fb85292ca01b3fed629b332118563088c9f9e40
3
  size 3763691728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd7b451c148acf7a280b42f34f7779dbbd587d85ce8aeb580fb1ef1a7a5a1095
3
  size 3763691728
tokenizer_config.json CHANGED
@@ -20,7 +20,7 @@
20
  "vision_bos_token": "<|vision_start|>",
21
  "vision_eos_token": "<|vision_end|>"
22
  },
23
- "pad_token": "<|im_end|>",
24
  "pretokenize_regex": "(?i:'s|'t|'re|'ve|'m|'ll|'d)|[^\\r\\n\\p{L}\\p{N}]?[\\p{L}\\p{M}]+|\\p{N}| ?[^\\s\\p{L}\\p{M}\\p{N}]+[\\r\\n]*|\\s*[\\r\\n]+|\\s+(?!\\S)|\\s+",
25
  "split_special_tokens": false,
26
  "tokenizer_class": "TokenizersBackend",
 
20
  "vision_bos_token": "<|vision_start|>",
21
  "vision_eos_token": "<|vision_end|>"
22
  },
23
+ "pad_token": "<|endoftext|>",
24
  "pretokenize_regex": "(?i:'s|'t|'re|'ve|'m|'ll|'d)|[^\\r\\n\\p{L}\\p{N}]?[\\p{L}\\p{M}]+|\\p{N}| ?[^\\s\\p{L}\\p{M}\\p{N}]+[\\r\\n]*|\\s*[\\r\\n]+|\\s+(?!\\S)|\\s+",
25
  "split_special_tokens": false,
26
  "tokenizer_class": "TokenizersBackend",