Naphula committed on
Commit
1cc3c50
·
verified ·
1 Parent(s): fd3b9c3

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +5 -0
README.md CHANGED
@@ -30,6 +30,11 @@ python analyze_old.py A:\HF\hub\!models--inflatebot--MN-12B-Mag-Mell-R1\ablit_pr
30
  sharded_ablate.py magmell.yml --normpreserve
31
  ```
32
 
 
 
 
 
 
33
  ---
34
 
35
  https://huggingface.co/inflatebot/MN-12B-Mag-Mell-R1
 
30
  sharded_ablate.py magmell.yml --normpreserve
31
  ```
32
 
33
+ **Q8_K_XL:**
34
+ ```
35
+ llama-quantize --tensor-type output.weight=F16 --tensor-type token_embd.weight=F16 --tensor-type "blk.(3|4|5|6|7|8|9|10|11|12|13|14|15|16|17|18|19|20|21|22|23|24|25|26|27|28|29|30|31|32|33|34|35|36|37).attn_k.weight=Q8_0" --tensor-type "blk.(0|1|2|38|39).attn_k.weight=F16" --tensor-type "blk.(3|4|5|6|7|8|9|10|11|12|13|14|15|16|17|18|19|20|21|22|23|24|25|26|27|28|29|30|31|32|33|34|35|36|37).attn_output.weight=Q8_0" --tensor-type "blk.(0|1|2|38|39).attn_output.weight=F16" --tensor-type "blk.(3|4|5|6|7|8|9|10|11|12|13|14|15|16|17|18|19|20|21|22|23|24|25|26|27|28|29|30|31|32|33|34|35|36|37).attn_q.weight=Q8_0" --tensor-type "blk.(0|1|2|38|39).attn_q.weight=F16" --tensor-type "blk.(3|4|5|6|7|8|9|10|11|12|13|14|15|16|17|18|19|20|21|22|23|24|25|26|27|28|29|30|31|32|33|34|35|36|37).attn_v.weight=Q8_0" --tensor-type "blk.(0|1|2|38|39).attn_v.weight=F16" --tensor-type "blk.(3|4|5|6|7|8|9|10|11|12|13|14|15|16|17|18|19|20|21|22|23|24|25|26|27|28|29|30|31|32|33|34|35|36|37).ffn_down.weight=Q8_0" --tensor-type "blk.(0|1|2|38|39).ffn_down.weight=F16" --tensor-type "blk.(3|4|5|6|7|8|9|10|11|12|13|14|15|16|17|18|19|20|21|22|23|24|25|26|27|28|29|30|31|32|33|34|35|36|37).ffn_gate.weight=Q8_0" --tensor-type "blk.(0|1|2|38|39).ffn_gate.weight=F16" --tensor-type "blk.(3|4|5|6|7|8|9|10|11|12|13|14|15|16|17|18|19|20|21|22|23|24|25|26|27|28|29|30|31|32|33|34|35|36|37).ffn_up.weight=Q8_0" --tensor-type "blk.(0|1|2|38|39).ffn_up.weight=F16" <input.gguf> <output.gguf> Q8_0
36
+ ```
37
+
38
  ---
39
 
40
  https://huggingface.co/inflatebot/MN-12B-Mag-Mell-R1