Brunobkr committed on
Commit
a393970
·
verified ·
1 Parent(s): 3be9d1e

Upload RUN_SERVER.txt

Browse files
Files changed (1) hide show
  1. RUN_SERVER.txt +29 -0
RUN_SERVER.txt ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ QUANTIZAÇÃO -------------------------------------------------------------------------------------------
2
+ # Convert the f16 Granite 3.3 8B instruct GGUF into a Q4_K_M file; the paths are relative, so run this from the directory that contains llama.cpp/ and GGUFS/.
3
+ -------------------------------------------------------------------------------------------------------------
4
+ ./llama.cpp/build/bin/llama-quantize ./GGUFS/granite-3.3-8b-instruct-f16.gguf ./GGUFS/ΩFFΣLLIα_granite-3.3-8b-instruct-Q4_K_M.gguf Q4_K_M
5
+
6
+
7
+ -------------------------------------------------------------------------------------------------------------
8
+ # Start llama-server with the LFM2-8B-A1B Q6_K model on 0.0.0.0:3301 (all interfaces). Every line except the last must end in '\' so the shell reads ONE command.
9
+ # NOTE(review): --ignore-eos together with --n-predict -1 presumably removes both stop conditions for generation; confirm that this is intended.
10
+ /home/userk21/llama.cpp/build/bin/llama-server \
11
+ -m /home/userk21/GGUFS/ΩFFΣLLIα_LFM2-8B-A1B-Q6_K.gguf \
12
+ --ctx-size 120000 \
13
+ --threads "$(nproc)" \
14
+ --ignore-eos \
15
+ --n-predict -1 \
16
+ --flash-attn on \
17
+ --port 3301 \
18
+ --host 0.0.0.0
19
+
20
+ ------------------------------------------------------------------------------------------------------------
21
+ # Start llama-server with the Granite 3.3 8B instruct Q4_K_M model on 0.0.0.0:3301 (all interfaces). Every line except the last must end in '\' so the shell reads ONE command.
22
+ /home/userk21/llama.cpp/build/bin/llama-server \
23
+ -m /home/userk21/GGUFS/ΩFFΣLLIα_granite-3.3-8b-instruct-Q4_K_M.gguf \
24
+ --threads "$(nproc)" \
25
+ --ignore-eos \
26
+ --n-predict -1 \
27
+ --flash-attn on \
28
+ --port 3301 \
29
+ --host 0.0.0.0