Added processor with 128 tokens
- tokenizer.json +8 -1
- tokenizer_config.json +2 -1
- vocab.json +0 -0
tokenizer.json
CHANGED
@@ -1,7 +1,14 @@
 {
   "version": "1.0",
   "truncation": null,
-  "padding": null,
+  "padding": {
+    "strategy": "BatchLongest",
+    "direction": "Right",
+    "pad_to_multiple_of": null,
+    "pad_id": 49407,
+    "pad_type_id": 0,
+    "pad_token": "<|endoftext|>"
+  },
   "added_tokens": [
     {
       "id": 49406,
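For reference, a minimal sketch of how the new padding block behaves when this tokenizer.json is loaded directly with the `tokenizers` library (not part of the commit; it assumes the file has been downloaded locally, and the example texts are arbitrary):

```python
from tokenizers import Tokenizer

# Loading the serialized tokenizer restores the new padding configuration
# (pad id 49407, pad token <|endoftext|>, padding to the longest in the batch).
tok = Tokenizer.from_file("tokenizer.json")
print(tok.padding)  # padding params restored from the file, or None if absent

# encode_batch now pads every sequence in the batch to the longest one,
# on the right, using <|endoftext|>.
encodings = tok.encode_batch(["a photo of a cat", "a dog"])
print([len(e.ids) for e in encodings])  # equal lengths after padding
```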
tokenizer_config.json
CHANGED
@@ -24,8 +24,9 @@
   "eos_token": "<|endoftext|>",
   "errors": "replace",
   "extra_special_tokens": {},
-  "model_max_length":
+  "model_max_length": 128,
   "pad_token": "<|endoftext|>",
+  "processor_class": "CLIPProcessor",
   "tokenizer_class": "CLIPTokenizer",
   "unk_token": "<|endoftext|>"
 }
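On the transformers side, a minimal sketch of what the two new tokenizer_config.json entries change (the repo id below is a placeholder, not the actual repository, and it assumes the repo also ships the image processor config that CLIPProcessor expects):

```python
from transformers import AutoProcessor, CLIPTokenizer

repo_id = "your-namespace/your-clip-model"  # placeholder repo id

tokenizer = CLIPTokenizer.from_pretrained(repo_id)
print(tokenizer.model_max_length)  # 128, from the updated config

# padding="max_length" now produces fixed 128-token sequences.
enc = tokenizer(["a photo of a cat"], padding="max_length",
                truncation=True, return_tensors="pt")
print(enc["input_ids"].shape)  # torch.Size([1, 128])

# "processor_class": "CLIPProcessor" lets AutoProcessor pick the right class.
processor = AutoProcessor.from_pretrained(repo_id)
print(type(processor).__name__)  # CLIPProcessor
```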
vocab.json
CHANGED
The diff for this file is too large to render. See raw diff.