Visual Question Answering
Safetensors
File size: 404 Bytes
1b32afc
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
{
  "do_convert_rgb": true,
  "do_normalize": true,
  "font_path": "/cluster/work/projects/nn8104k/kjetil_thesis/.cache/models--ybelkada--fonts/snapshots/7f29c3755a0de4c552c4b474cef01d10eb3d5e8b/Arial.TTF",
  "image_processor_type": "Pix2StructImageProcessor",
  "is_vqa": true,
  "max_patches": 2048,
  "patch_size": {
    "height": 16,
    "width": 16
  },
  "processor_class": "Pix2StructProcessor"
}