gemma4-vision-encoder / preprocessor_config.json
rnagabh's picture
Initial upload: Gemma 4 vision encoder (569.6M, 27-layer ViT with 2D RoPE)
3a8691c verified
{
"do_convert_rgb": true,
"do_normalize": false,
"do_rescale": true,
"do_resize": true,
"image_mean": [
0.0,
0.0,
0.0
],
"image_processor_type": "Gemma4ImageProcessor",
"image_seq_length": 280,
"image_std": [
1.0,
1.0,
1.0
],
"max_soft_tokens": 280,
"patch_size": 16,
"pooling_kernel_size": 3,
"resample": 3,
"rescale_factor": 0.00392156862745098
}