Fix tokenizer to not produce token_type_ids (ModernBERT compatibility)
Browse files
- tokenizer_config.json +1 -0
tokenizer_config.json
CHANGED
@@ -1,6 +1,7 @@
 {
   "additional_special_tokens": null,
   "backend": "tokenizers",
+  "model_input_names": ["input_ids", "attention_mask"],
   "bos_token": "<|start|>",
   "cls_token": "<|cls|>",
   "eos_token": "<|end|>",