davezaxh committed on
Commit
3f0f32e
·
verified ·
1 Parent(s): a51d594

Upload quantizer.sh with huggingface_hub

Browse files
Files changed (1) hide show
  1. quantizer.sh +25 -0
quantizer.sh ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
# Quantize llama-3.2-f16.gguf into each type listed in TYPES, writing one
# output file per type to quantized/llama-3.2-<TYPE>.gguf.
#
# Inputs (relative to the current directory):
#   llama-3.2-f16.gguf  - source model passed to llama-quantize
#   llama-3.2.imatrix   - passed via --imatrix, only for types matching IQ*
#
# Requires `llama-quantize` on PATH.
#
# Exit status: 0 when every type was quantized, 1 when the output directory
# could not be created or at least one type failed.

# Quantization types to produce, processed in this order.
TYPES=(
  Q8_0
  Q4_K_M
  IQ4_XS
  IQ3_S
)

# Without the output directory every run below would fail, so stop early.
mkdir -p quantized || exit 1

# Types whose llama-quantize run returned a non-zero status.
failed=()

for T in "${TYPES[@]}"; do
  echo "$T: Quantization"

  # Build the argument list once; only the --imatrix option differs
  # between the IQ* types and the rest.
  args=()
  if [[ $T == IQ* ]]; then
    args+=(--imatrix llama-3.2.imatrix)
  fi
  args+=(llama-3.2-f16.gguf "quantized/llama-3.2-$T.gguf" "$T")

  # Keep going after a failure so the remaining types are still attempted,
  # but remember it so the script does not report success overall.
  if ! llama-quantize "${args[@]}"; then
    echo "$T: Quantization failed" >&2
    failed+=("$T")
  fi
done

if (( ${#failed[@]} > 0 )); then
  echo "Quantization failed for: ${failed[*]}" >&2
  exit 1
fi