Update hf_quant_config.json
Browse files- hf_quant_config.json +2 -1
hf_quant_config.json
CHANGED
|
@@ -7,7 +7,8 @@
|
|
| 7 |
"quant_algo": "FP8",
|
| 8 |
"kv_cache_quant_algo": null,
|
| 9 |
"exclude_modules": [
|
| 10 |
-
"lm_head"
|
|
|
|
| 11 |
]
|
| 12 |
}
|
| 13 |
}
|
|
|
|
| 7 |
"quant_algo": "FP8",
|
| 8 |
"kv_cache_quant_algo": null,
|
| 9 |
"exclude_modules": [
|
| 10 |
+
"lm_head",
|
| 11 |
+
"model.layers.92"
|
| 12 |
]
|
| 13 |
}
|
| 14 |
}
|