binary1ne committed on
Commit
2583f0d
·
verified ·
1 Parent(s): 3c353bd

Create Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +9 -0
Dockerfile ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
# Serve a Hugging Face Hub model through vLLM's OpenAI-compatible HTTP API.
#
# The base image must provide `python` and the `vllm` package, because CMD
# runs `python -m vllm.entrypoints.openai.api_server` directly.
# NOTE(review): this is a third-party image pinned only by tag; confirm its
# contents and consider pinning by digest for reproducible builds.
FROM harshmanvar/vllm-cpu-only:v1

# Document the port the API server listens on (keep in sync with --port below).
# EXPOSE is metadata only; it does not publish the port by itself.
EXPOSE 7860

# Start the API server with a model from the HF Hub.
#   --host 0.0.0.0       listen on all interfaces so the server is reachable
#                        from outside the container
#   --trust-remote-code  NOTE(review): allows code shipped in the model repo
#                        to be executed; drop it if the model loads without it
# NOTE(review): the model name indicates a bitsandbytes 4-bit checkpoint;
# confirm that the CPU-only vLLM build in the base image can load it.
# Exec (JSON-array) form is used so the server runs as PID 1 and receives
# stop signals directly.
CMD ["python", "-m", "vllm.entrypoints.openai.api_server", \
     "--model", "unsloth/Llama-3.2-3B-bnb-4bit", \
     "--host", "0.0.0.0", \
     "--port", "7860", \
     "--trust-remote-code"]