config.json CHANGED
@@ -14,7 +14,7 @@
14
  "hidden_size": 8192,
15
  "initializer_range": 0.02,
16
  "intermediate_size": 29568,
17
- "max_position_embeddings": 65537,
18
  "max_window_layers": 80,
19
  "model_type": "qwen2_vl",
20
  "num_attention_heads": 64,
 
14
  "hidden_size": 8192,
15
  "initializer_range": 0.02,
16
  "intermediate_size": 29568,
17
+ "max_position_embeddings": 32768,
18
  "max_window_layers": 80,
19
  "model_type": "qwen2_vl",
20
  "num_attention_heads": 64,
preprocessor_config.json CHANGED
@@ -8,6 +8,7 @@
8
  0.4578275,
9
  0.40821073
10
  ],
 
11
  "image_std": [
12
  0.26862954,
13
  0.26130258,
@@ -21,8 +22,8 @@
21
  "resample": 3,
22
  "rescale_factor": 0.00392156862745098,
23
  "size": {
24
- "longest_edge": 2116800,
25
- "shortest_edge": 3136
26
  },
27
  "temporal_patch_size": 2
28
  }
 
8
  0.4578275,
9
  0.40821073
10
  ],
11
+ "image_processor_type": "Qwen2VLImageProcessor",
12
  "image_std": [
13
  0.26862954,
14
  0.26130258,
 
22
  "resample": 3,
23
  "rescale_factor": 0.00392156862745098,
24
  "size": {
25
+ "max_pixels": 2116800,
26
+ "min_pixels": 3136
27
  },
28
  "temporal_patch_size": 2
29
  }
tokenizer_config.json CHANGED
@@ -140,5 +140,6 @@
140
  "padding_side": "right",
141
  "processor_class": "Qwen2VLProcessor",
142
  "split_special_tokens": false,
 
143
  "unk_token": null
144
  }
 
140
  "padding_side": "right",
141
  "processor_class": "Qwen2VLProcessor",
142
  "split_special_tokens": false,
143
+ "tokenizer_class": "Qwen2Tokenizer",
144
  "unk_token": null
145
  }