tarruda committed on
Commit
ce4aeca
·
verified ·
1 Parent(s): c364566

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -42,3 +42,7 @@ Q5_S/MiniMax-M2.7-256x4.9B-Q5_S-00002-of-00004.gguf filter=lfs diff=lfs merge=lf
42
  Q5_S/MiniMax-M2.7-256x4.9B-Q5_S-00003-of-00004.gguf filter=lfs diff=lfs merge=lfs -text
43
  Q5_S/MiniMax-M2.7-256x4.9B-Q5_S-00004-of-00004.gguf filter=lfs diff=lfs merge=lfs -text
44
  imatrix.gguf filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
42
  Q5_S/MiniMax-M2.7-256x4.9B-Q5_S-00003-of-00004.gguf filter=lfs diff=lfs merge=lfs -text
43
  Q5_S/MiniMax-M2.7-256x4.9B-Q5_S-00004-of-00004.gguf filter=lfs diff=lfs merge=lfs -text
44
  imatrix.gguf filter=lfs diff=lfs merge=lfs -text
45
+ Q4_K/MiniMax-M2.7-256x4.9B-Q4_K-00001-of-00004.gguf filter=lfs diff=lfs merge=lfs -text
46
+ Q4_K/MiniMax-M2.7-256x4.9B-Q4_K-00002-of-00004.gguf filter=lfs diff=lfs merge=lfs -text
47
+ Q4_K/MiniMax-M2.7-256x4.9B-Q4_K-00003-of-00004.gguf filter=lfs diff=lfs merge=lfs -text
48
+ Q4_K/MiniMax-M2.7-256x4.9B-Q4_K-00004-of-00004.gguf filter=lfs diff=lfs merge=lfs -text
Q4_K/MiniMax-M2.7-256x4.9B-Q4_K-00001-of-00004.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ba34e5363577d34bf56e655d603180f4ed42ffb994fd52f0a8ddee6fb724b43
3
+ size 8237504
Q4_K/MiniMax-M2.7-256x4.9B-Q4_K-00002-of-00004.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f959188e12f95f08c0907089e49fb29c12486dc95f33bcab8f8727c332792e7
3
+ size 41983346304
Q4_K/MiniMax-M2.7-256x4.9B-Q4_K-00003-of-00004.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ceab2f20f0c2651f2738b9891e72979a0d06aa090c76a102ff3c49ce72cfc412
3
+ size 41879006048
Q4_K/MiniMax-M2.7-256x4.9B-Q4_K-00004-of-00004.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e48e87054513246853b8ccdcfeb3d64d6a4d3f6a32b25c5298f6c563c0a333f7
3
+ size 27032460384
README.md CHANGED
@@ -7,5 +7,4 @@ Minimax 2.7 quants where I tried to extract the maximum performance for my hardw
7
 
8
  This is similar to the AesSedai IQ4_XS quant (and uses the same imatrix), but the down tensors are replaced:
9
 
10
- - Q4_S replaces IQ4_XS with Q4_K
11
- - Q5_S replaces IQ4_XS with Q5_K
 
7
 
8
  This is similar to the AesSedai IQ4_XS quant (and uses the same imatrix), but the down tensors are replaced:
9
 
10
+ - Q4_K replaces IQ4_XS with Q4_K
 
scripts/quantize.sh CHANGED
@@ -4,14 +4,14 @@ set -euo pipefail
4
 
5
  recipes=(
6
  "
7
- MIX=Q5_S
8
  TYPE_FFN_GATE_UP_EXPS=IQ3_S
9
  TYPE_FFN_DOWN_EXPS=Q5_K
10
  TYPE_DEFAULT=Q8_0
11
  "
12
 
13
  "
14
- MIX=Q4_S
15
  TYPE_FFN_GATE_UP_EXPS=IQ3_S
16
  TYPE_FFN_DOWN_EXPS=Q4_K
17
  TYPE_DEFAULT=Q8_0
 
4
 
5
  recipes=(
6
  "
7
+ MIX=Q5_K
8
  TYPE_FFN_GATE_UP_EXPS=IQ3_S
9
  TYPE_FFN_DOWN_EXPS=Q5_K
10
  TYPE_DEFAULT=Q8_0
11
  "
12
 
13
  "
14
+ MIX=Q4_K
15
  TYPE_FFN_GATE_UP_EXPS=IQ3_S
16
  TYPE_FFN_DOWN_EXPS=Q4_K
17
  TYPE_DEFAULT=Q8_0