sujayrittikar
/

mlc_mbert_cased_aug

Model card Files Files and versions

sujayrittikar committed on Dec 16, 2024

Commit

302b88d

·

verified ·

1 Parent(s): d9493f0

Upload tokenizer

Files changed (2) hide show

tokenizer.json +2 -11
tokenizer_config.json +1 -4

tokenizer.json CHANGED Viewed

@@ -2,20 +2,11 @@
   "version": "1.0",
   "truncation": {
     "direction": "Right",
-    "max_length": 128,
     "strategy": "LongestFirst",
     "stride": 0
   },
-  "padding": {
-    "strategy": {
-      "Fixed": 128
-    },
-    "direction": "Right",
-    "pad_to_multiple_of": null,
-    "pad_id": 0,
-    "pad_type_id": 0,
-    "pad_token": "[PAD]"
-  },
   "added_tokens": [
     {
       "id": 0,

   "version": "1.0",
   "truncation": {
     "direction": "Right",
+    "max_length": 10,
     "strategy": "LongestFirst",
     "stride": 0
   },
+  "padding": null,
   "added_tokens": [
     {
       "id": 0,

tokenizer_config.json CHANGED Viewed

@@ -45,12 +45,9 @@
   "cls_token": "[CLS]",
   "do_lower_case": false,
   "mask_token": "[MASK]",
-  "max_length": 128,
   "model_max_length": 512,
-  "pad_to_multiple_of": null,
   "pad_token": "[PAD]",
-  "pad_token_type_id": 0,
-  "padding_side": "right",
   "sep_token": "[SEP]",
   "stride": 0,
   "strip_accents": null,

   "cls_token": "[CLS]",
   "do_lower_case": false,
   "mask_token": "[MASK]",
+  "max_length": 10,
   "model_max_length": 512,
   "pad_token": "[PAD]",
   "sep_token": "[SEP]",
   "stride": 0,
   "strip_accents": null,