Update handler.py
Browse files
- handler.py +1 -4
handler.py
CHANGED
|
@@ -11,10 +11,7 @@ from transformers import AutoModelForVision2Seq, AutoProcessor, BitsAndBytesConf
|
|
| 11 |
model_id = "ibm-granite/granite-vision-3.2-2b"
|
| 12 |
|
| 13 |
bnb_config = BitsAndBytesConfig(
|
| 14 |
-
|
| 15 |
-
bnb_4bit_use_double_quant=True,
|
| 16 |
-
bnb_4bit_quant_type="nf4",
|
| 17 |
-
bnb_4bit_compute_dtype=torch.bfloat16,
|
| 18 |
llm_int8_skip_modules=["vision_tower", "lm_head"],
|
| 19 |
llm_int8_enable_fp32_cpu_offload=True
|
| 20 |
)
|
|
|
|
| 11 |
model_id = "ibm-granite/granite-vision-3.2-2b"
|
| 12 |
|
| 13 |
bnb_config = BitsAndBytesConfig(
|
| 14 |
+
load_in_8bit=True,
|
|
|
|
|
|
|
|
|
|
| 15 |
llm_int8_skip_modules=["vision_tower", "lm_head"],
|
| 16 |
llm_int8_enable_fp32_cpu_offload=True
|
| 17 |
)
|