susnato
/

codeparrot

Text Generation

text-generation-inference

Model card · Files and versions

susnato committed on Jan 3, 2023

Commit

c329988

·

1 Parent(s): 2557df1

Upload tokenizer

Files changed (1) hide show

tokenizer.json +5 -8

tokenizer.json CHANGED Viewed

@@ -5,32 +5,29 @@
   "added_tokens": [
     {
       "id": 0,
       "content": "<|endoftext|>",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
-      "normalized": false,
-      "special": true
     }
   ],
   "normalizer": null,
   "pre_tokenizer": {
     "type": "ByteLevel",
     "add_prefix_space": false,
-    "trim_offsets": true,
-    "use_regex": true
   },
   "post_processor": {
     "type": "ByteLevel",
     "add_prefix_space": true,
-    "trim_offsets": false,
-    "use_regex": true
   },
   "decoder": {
     "type": "ByteLevel",
     "add_prefix_space": true,
-    "trim_offsets": true,
-    "use_regex": true
   },
   "model": {
     "type": "BPE",

   "added_tokens": [
     {
       "id": 0,
+      "special": true,
       "content": "<|endoftext|>",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
+      "normalized": false
     }
   ],
   "normalizer": null,
   "pre_tokenizer": {
     "type": "ByteLevel",
     "add_prefix_space": false,
+    "trim_offsets": true
   },
   "post_processor": {
     "type": "ByteLevel",
     "add_prefix_space": true,
+    "trim_offsets": false
   },
   "decoder": {
     "type": "ByteLevel",
     "add_prefix_space": true,
+    "trim_offsets": true
   },
   "model": {
     "type": "BPE",