# shahidul034's picture
# Add files using upload-large-folder tool
# 1db7196 verified
# cd /home/mshahidul/llama.cpp
# export CUDA_DEVICE_ORDER=PCI_BUS_ID
# export CUDA_VISIBLE_DEVICES=3
# ./build/bin/llama-server \
# -m /home/mshahidul/readctrl/models/translategemma-27b-it-Q8_0.gguf \
# -ngl 99 \
# -fa on \
# -c 16384 \
# --port 8081 \
# --host 0.0.0.0
# Launch llama-server for the DeepSeek-R1-Distill-Llama-8B (Q4_K_M) GGUF model.
#
# Both the server binary (./build/bin/llama-server) and the model path given to
# -m are relative, so they are resolved against the llama.cpp checkout that the
# script changes into first.

# Abort if the checkout is missing: continuing would resolve the relative
# binary and model paths against whatever directory the caller happened to be in.
cd /home/mshahidul/llama.cpp || {
  printf 'error: cannot cd to %s\n' '/home/mshahidul/llama.cpp' >&2
  exit 1
}

# Order CUDA devices by PCI bus ID, then expose only device index 4 to the server.
export CUDA_DEVICE_ORDER=PCI_BUS_ID
export CUDA_VISIBLE_DEVICES=4

# Flags (see the llama-server documentation for exact semantics):
#   -ngl 99         GPU layer count to offload
#   -fa on          flash attention enabled
#   -c 16384        context size
#   --port 8085     HTTP port to listen on
#   --host 0.0.0.0  bind address (all interfaces)
./build/bin/llama-server \
  -m unsloth/DeepSeek-R1-Distill-Llama-8B-GGUF/DeepSeek-R1-Distill-Llama-8B-Q4_K_M.gguf \
  -ngl 99 \
  -fa on \
  -c 16384 \
  --port 8085 \
  --host 0.0.0.0