alina0195
/

ro-tokenizer

alina0195 committed on Dec 4, 2025

Commit

cd9e7ed

verified ·

1 Parent(s): 306229e

init

Files changed (2) hide show

tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json CHANGED Viewed

@@ -1,5 +1,4 @@
 {
-  "add_prefix_space": false,
   "added_tokens_decoder": {
     "0": {
       "content": "[MASK]",
@@ -228,12 +227,7 @@
   },
   "clean_up_tokenization_spaces": true,
   "cls_token": "[CLS]",
-  "extra_special_tokens": {},
   "mask_token": "[MASK]",
-  "model_input_names": [
-    "input_ids",
-    "attention_mask"
-  ],
   "model_max_length": 128000,
   "pad_token": "[PAD]",
   "sep_token": "[SEP]",

 {
   "added_tokens_decoder": {
     "0": {
       "content": "[MASK]",
   },
   "clean_up_tokenization_spaces": true,
   "cls_token": "[CLS]",
   "mask_token": "[MASK]",
   "model_max_length": 128000,
   "pad_token": "[PAD]",
   "sep_token": "[SEP]",