baseten-admin committed on
Commit
3146ce9
·
verified ·
1 Parent(s): 7208caa

Update hf_quant_config.json

Browse files
Files changed (1) hide show
  1. hf_quant_config.json +2 -1
hf_quant_config.json CHANGED
@@ -7,7 +7,8 @@
7
  "quant_algo": "FP8",
8
  "kv_cache_quant_algo": null,
9
  "exclude_modules": [
10
- "lm_head"
 
11
  ]
12
  }
13
  }
 
7
  "quant_algo": "FP8",
8
  "kv_cache_quant_algo": null,
9
  "exclude_modules": [
10
+ "lm_head",
11
+ "model.layers.92"
12
  ]
13
  }
14
  }