#!/usr/bin/env bash
#
# Launch a llama.cpp `llama-server` instance serving a local GGUF model.
#
# llama-server flags used below (see the llama.cpp server documentation):
#   -m       path to the GGUF model file; a relative path is resolved against
#            the llama.cpp checkout that this script changes into
#   -ngl 99  number of model layers to offload to the GPU (99 is presumably
#            "more than the model has", i.e. offload everything)
#   -fa on   enable flash attention
#   -c       context size in tokens
#   --port   TCP port the HTTP server listens on
#   --host   bind address; 0.0.0.0 accepts connections on every interface,
#            so the server is reachable from other machines on the network
#
# Environment:
#   CUDA_DEVICE_ORDER=PCI_BUS_ID  number GPUs by PCI bus ID so the index in
#                                 CUDA_VISIBLE_DEVICES is stable
#   CUDA_VISIBLE_DEVICES          the single GPU the server is allowed to use

# --- Disabled alternative configuration (translategemma 27B, GPU 3, port 8081) ---
# cd /home/mshahidul/llama.cpp
# export CUDA_DEVICE_ORDER=PCI_BUS_ID
# export CUDA_VISIBLE_DEVICES=3
# ./build/bin/llama-server \
#   -m /home/mshahidul/readctrl/models/translategemma-27b-it-Q8_0.gguf \
#   -ngl 99 \
#   -fa on \
#   -c 16384 \
#   --port 8081 \
#   --host 0.0.0.0

# --- Active configuration (DeepSeek-R1-Distill-Llama-8B, GPU 4, port 8085) ---

# Abort if the checkout is missing: both the server binary and the model path
# below are relative to this directory.
cd /home/mshahidul/llama.cpp || {
  printf 'error: cannot cd to %s\n' '/home/mshahidul/llama.cpp' >&2
  exit 1
}

export CUDA_DEVICE_ORDER=PCI_BUS_ID
export CUDA_VISIBLE_DEVICES=4

./build/bin/llama-server \
  -m unsloth/DeepSeek-R1-Distill-Llama-8B-GGUF/DeepSeek-R1-Distill-Llama-8B-Q4_K_M.gguf \
  -ngl 99 \
  -fa on \
  -c 16384 \
  --port 8085 \
  --host 0.0.0.0