andy006 committed on
Commit
ed607b3
·
verified ·
1 Parent(s): 169f449

Upload model trained with Unsloth

Browse files

Upload model trained with Unsloth 2x faster

special_tokens_map.json CHANGED
@@ -14,7 +14,7 @@
14
  "single_word": false
15
  },
16
  "pad_token": {
17
- "content": "<|reserved_special_token_250|>",
18
  "lstrip": false,
19
  "normalized": false,
20
  "rstrip": false,
 
14
  "single_word": false
15
  },
16
  "pad_token": {
17
+ "content": "<|end_of_text|>",
18
  "lstrip": false,
19
  "normalized": false,
20
  "rstrip": false,
tokenizer.json CHANGED
@@ -2329,69 +2329,10 @@
2329
  ]
2330
  },
2331
  "post_processor": {
2332
- "type": "Sequence",
2333
- "processors": [
2334
- {
2335
- "type": "ByteLevel",
2336
- "add_prefix_space": true,
2337
- "trim_offsets": false,
2338
- "use_regex": true
2339
- },
2340
- {
2341
- "type": "TemplateProcessing",
2342
- "single": [
2343
- {
2344
- "SpecialToken": {
2345
- "id": "<|begin_of_text|>",
2346
- "type_id": 0
2347
- }
2348
- },
2349
- {
2350
- "Sequence": {
2351
- "id": "A",
2352
- "type_id": 0
2353
- }
2354
- }
2355
- ],
2356
- "pair": [
2357
- {
2358
- "SpecialToken": {
2359
- "id": "<|begin_of_text|>",
2360
- "type_id": 0
2361
- }
2362
- },
2363
- {
2364
- "Sequence": {
2365
- "id": "A",
2366
- "type_id": 0
2367
- }
2368
- },
2369
- {
2370
- "SpecialToken": {
2371
- "id": "<|begin_of_text|>",
2372
- "type_id": 1
2373
- }
2374
- },
2375
- {
2376
- "Sequence": {
2377
- "id": "B",
2378
- "type_id": 1
2379
- }
2380
- }
2381
- ],
2382
- "special_tokens": {
2383
- "<|begin_of_text|>": {
2384
- "id": "<|begin_of_text|>",
2385
- "ids": [
2386
- 128000
2387
- ],
2388
- "tokens": [
2389
- "<|begin_of_text|>"
2390
- ]
2391
- }
2392
- }
2393
- }
2394
- ]
2395
  },
2396
  "decoder": {
2397
  "type": "ByteLevel",
 
2329
  ]
2330
  },
2331
  "post_processor": {
2332
+ "type": "ByteLevel",
2333
+ "add_prefix_space": true,
2334
+ "trim_offsets": false,
2335
+ "use_regex": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2336
  },
2337
  "decoder": {
2338
  "type": "ByteLevel",
tokenizer_config.json CHANGED
@@ -2058,7 +2058,7 @@
2058
  "attention_mask"
2059
  ],
2060
  "model_max_length": 8192,
2061
- "pad_token": "<|reserved_special_token_250|>",
2062
- "padding_side": "left",
2063
  "tokenizer_class": "PreTrainedTokenizerFast"
2064
  }
 
2058
  "attention_mask"
2059
  ],
2060
  "model_max_length": 8192,
2061
+ "pad_token": "<|end_of_text|>",
2062
+ "padding_side": "right",
2063
  "tokenizer_class": "PreTrainedTokenizerFast"
2064
  }