binary1ne committed on
Commit
9dcedc3
·
verified ·
1 Parent(s): 3ac3871

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +4 -4
Dockerfile CHANGED
@@ -12,10 +12,10 @@ WORKDIR /app
12
  # You might need to adjust this depending on how you're providing the model
13
  COPY ./model /app/model
14
 
15
- # Set the environment variable for Hugging Face token if you're using gated models
16
- # Replace <YOUR_HUGGINGFACE_TOKEN> with your actual token
17
- ENV HUGGING_FACE_HUB_TOKEN="<YOUR_HUGGINGFACE_TOKEN>"
18
 
19
  # Command to run the vLLM OpenAI-compatible server with your model
20
  # Replace "your-model-name" with the actual model ID from Hugging Face
21
- CMD ["python", "-m", "vllm.entrypoints.openai.api_server", "--model", "your-model-name", "--host", "0.0.0.0", "--port", "8000"]
 
12
  # You might need to adjust this depending on how you're providing the model
13
  COPY ./model /app/model
14
 
15
+ # Set the environment variable for the Hugging Face token (not strictly needed because the model is not gated, but good practice)
16
+ # You can uncomment this and set it if you prefer.
17
+ # ENV HUGGING_FACE_HUB_TOKEN="<YOUR_HUGGINGFACE_TOKEN>"
18
 
19
  # Command to run the vLLM OpenAI-compatible server with your model
20
  # Replace "your-model-name" with the actual model ID from Hugging Face
21
+ CMD ["python", "-m", "vllm.entrypoints.openai.api_server", "--model", "unsloth/Llama-3.2-3B-bnb-4bit", "--host", "0.0.0.0", "--port", "7860"]