uitars

@@ -14,7 +14,7 @@
   "hidden_size": 8192,
   "initializer_range": 0.02,
   "intermediate_size": 29568,
-  "max_position_embeddings": 65537,
   "max_window_layers": 80,
   "model_type": "qwen2_vl",
   "num_attention_heads": 64,

   "hidden_size": 8192,
   "initializer_range": 0.02,
   "intermediate_size": 29568,
+  "max_position_embeddings": 32768,
   "max_window_layers": 80,
   "model_type": "qwen2_vl",
   "num_attention_heads": 64,

preprocessor_config.json CHANGED Viewed

@@ -8,6 +8,7 @@
     0.4578275,
     0.40821073
   ],
   "image_std": [
     0.26862954,
     0.26130258,
@@ -21,8 +22,8 @@
   "resample": 3,
   "rescale_factor": 0.00392156862745098,
   "size": {
-    "longest_edge": 2116800,
-    "shortest_edge": 3136
   },
   "temporal_patch_size": 2
 }

     0.4578275,
     0.40821073
   ],
+  "image_processor_type": "Qwen2VLImageProcessor",
   "image_std": [
     0.26862954,
     0.26130258,
   "resample": 3,
   "rescale_factor": 0.00392156862745098,
   "size": {
+    "max_pixels": 2116800,
+    "min_pixels": 3136
   },
   "temporal_patch_size": 2
 }

tokenizer_config.json CHANGED Viewed

@@ -140,5 +140,6 @@
   "padding_side": "right",
   "processor_class": "Qwen2VLProcessor",
   "split_special_tokens": false,
   "unk_token": null
 }

   "padding_side": "right",
   "processor_class": "Qwen2VLProcessor",
   "split_special_tokens": false,
+  "tokenizer_class": "Qwen2Tokenizer",
   "unk_token": null
 }