binary1ne committed on
Commit
aa8dffb
·
verified ·
1 Parent(s): d87cc75

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +8 -1
Dockerfile CHANGED
@@ -36,5 +36,12 @@ RUN vllm -v
36
  # WORKDIR /workspace
37
  # ENTRYPOINT ["./start_server.sh"]
38
 
39
- RUN vllm serve unsloth/Llama-3.2-1B-bnb-4bit --host 0.0.0.0 --port 7860 --cpu-num-threads 2
40
  # CMD ["vllm serve unsloth/Llama-3.2-1B-bnb-4bit --host 0.0.0.0 --port 7860"]
 
 
 
 
 
 
 
 
36
  # WORKDIR /workspace
37
  # ENTRYPOINT ["./start_server.sh"]
38
 
39
+ # RUN vllm serve unsloth/Llama-3.2-1B-bnb-4bit --host 0.0.0.0 --port 7860 --cpu-num-threads 2
40
  # CMD ["vllm serve unsloth/Llama-3.2-1B-bnb-4bit --host 0.0.0.0 --port 7860"]
41
+ CMD python3 -u -m vllm.entrypoints.openai.api_server \
42
+ --model "unsloth/Llama-3.2-1B-bnb-4bit" \
43
+ --host 0.0.0.0 \
44
+ --port 7860 \
45
+ --tensor-parallel-size 1 \
46
+ --gpu-memory-utilization 0.0 \
47
+ --num-cpu-threads 2