Upload tokenizer

- tokenizer.json  +25 -5
- tokenizer_config.json  +2 -45
tokenizer.json
CHANGED

@@ -18,7 +18,7 @@
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
-      "normalized": true,
+      "normalized": false,
       "special": true
     },
     {
@@ -57,10 +57,30 @@
     "use_regex": true
   },
   "post_processor": {
-    "type": "
-    "
-
-
+    "type": "TemplateProcessing",
+    "single": [
+      {
+        "Sequence": {
+          "id": "A",
+          "type_id": 0
+        }
+      }
+    ],
+    "pair": [
+      {
+        "Sequence": {
+          "id": "A",
+          "type_id": 0
+        }
+      },
+      {
+        "Sequence": {
+          "id": "B",
+          "type_id": 1
+        }
+      }
+    ],
+    "special_tokens": {}
   },
   "decoder": {
     "type": "ByteLevel",
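The new post_processor is a passthrough TemplateProcessing template: sequence A keeps type_id 0, sequence B gets type_id 1, and no special tokens are inserted around either input. A minimal sketch of how the same processor could be built and attached with the tokenizers library (the local file path is an assumption; point it at your copy of the updated tokenizer.json):

from tokenizers import Tokenizer
from tokenizers.processors import TemplateProcessing

# Load the serialized tokenizer from this commit (local path is an assumption).
tok = Tokenizer.from_file("tokenizer.json")

# Equivalent of the JSON block added above: "$A" and "$B:1" reproduce the
# Sequence entries with type_id 0 and 1; no special tokens are injected.
tok.post_processor = TemplateProcessing(
    single="$A",
    pair="$A $B:1",
    special_tokens=[],
)

enc = tok.encode("def foo():", "return 1")
print(enc.tokens)
print(enc.type_ids)  # 0s for the first sequence, 1s for the second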
tokenizer_config.json
CHANGED

@@ -1,54 +1,11 @@
 {
-  "add_bos_token": false,
   "add_prefix_space": false,
-  "added_tokens_decoder": {
-    "0": {
-      "content": "<s>",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "1": {
-      "content": "<pad>",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "2": {
-      "content": "</s>",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "50000": {
-      "content": "<EOL>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "50001": {
-      "content": "<|UNKNOWN|>",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    }
-  },
+  "backend": "tokenizers",
   "bos_token": "<s>",
-  "clean_up_tokenization_spaces": false,
   "eos_token": "</s>",
   "errors": "replace",
-  "extra_special_tokens": {},
   "full_tokenizer_file": null,
+  "is_local": false,
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "</s>",
   "sep_token": "<EOL>",
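With added_tokens_decoder and the other removed fields gone from tokenizer_config.json, the special-token definitions are expected to come from tokenizer.json when the fast tokenizer is loaded. A quick sanity check, assuming a placeholder repo id (substitute the repository this commit belongs to):

from transformers import AutoTokenizer

# "your-org/your-model" is a placeholder, not the actual repo id.
tok = AutoTokenizer.from_pretrained("your-org/your-model")

# The tokens still referenced by the slimmed-down config should resolve.
print(tok.bos_token, tok.eos_token, tok.pad_token, tok.sep_token)

# Encoding a pair of texts exercises the new TemplateProcessing post-processor.
enc = tok("def foo():", "return 1")
print(enc.input_ids)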