NVILA-8B-HD-Video / preprocessor_config.json
Danny Yin
release
73b433d
raw
history blame contribute delete
869 Bytes
{
  "auto_map": {
    "AutoProcessor": "processing_nvila.NVILAProcessor"
  },
  "do_convert_rgb": null,
  "do_normalize": true,
  "do_rescale": true,
  "do_resize": true,
  "image_mean": [
    0.5,
    0.5,
    0.5
  ],
  "image_processor_type": "SiglipImageProcessor",
  "image_std": [
    0.5,
    0.5,
    0.5
  ],
  "processor_class": "NVILAProcessor",
  "resample": 3,
  "rescale_factor": 0.00392156862745098,
  "size": {
    "height": 392,
    "width": 392
  },
  "autogaze_model_id": "bfshi/AutoGaze",
  "gazing_ratio_tile": 0.75,
  "gazing_ratio_thumbnail": 0.75,
  "task_loss_requirement_tile": 0.7,
  "task_loss_requirement_thumbnail": 0.7,
  "target_scales": [
    56,
    112,
    196,
    392
  ],
  "target_patch_size": 16,
  "num_video_frames": 8,
  "max_tiles_video": 8,
  "num_video_frames_thumbnail": 8,
  "mm_projector_shuffle_num": 9,
  "max_batch_size_autogaze": 32
}