Portx committed on
Commit
f18c4d2
·
verified ·
1 Parent(s): a2b6dcd

Update handler.py

Browse files
Files changed (1) hide show
  1. handler.py +1 -4
handler.py CHANGED
@@ -11,10 +11,7 @@ from transformers import AutoModelForVision2Seq, AutoProcessor, BitsAndBytesConf
11
  model_id = "ibm-granite/granite-vision-3.2-2b"
12
 
13
  bnb_config = BitsAndBytesConfig(
14
- load_in_4bit=True,
15
- bnb_4bit_use_double_quant=True,
16
- bnb_4bit_quant_type="nf4",
17
- bnb_4bit_compute_dtype=torch.bfloat16,
18
  llm_int8_skip_modules=["vision_tower", "lm_head"],
19
  llm_int8_enable_fp32_cpu_offload=True
20
  )
 
11
  model_id = "ibm-granite/granite-vision-3.2-2b"
12
 
13
  bnb_config = BitsAndBytesConfig(
14
+ load_in_8bit=True,
 
 
 
15
  llm_int8_skip_modules=["vision_tower", "lm_head"],
16
  llm_int8_enable_fp32_cpu_offload=True
17
  )