Spaces:
Paused
Paused
Update Dockerfile
Browse files - Dockerfile +4 -4
Dockerfile
CHANGED
|
@@ -12,10 +12,10 @@ WORKDIR /app
|
|
| 12 |
# You might need to adjust this depending on how you're providing the model
|
| 13 |
COPY ./model /app/model
|
| 14 |
|
| 15 |
-
# Set the environment variable for Hugging Face token
|
| 16 |
-
#
|
| 17 |
-
ENV HUGGING_FACE_HUB_TOKEN="<YOUR_HUGGINGFACE_TOKEN>"
|
| 18 |
|
| 19 |
# Command to run the vLLM OpenAI-compatible server with your model
|
| 20 |
# Replace "your-model-name" with the actual model ID from Hugging Face
|
| 21 |
-
CMD ["python", "-m", "vllm.entrypoints.openai.api_server", "--model", "
|
|
|
|
| 12 |
# You might need to adjust this depending on how you're providing the model
|
| 13 |
COPY ./model /app/model
|
| 14 |
|
| 15 |
+
# Set the environment variable for the Hugging Face token (not strictly needed, because this is not a gated model, but good practice)
|
| 16 |
+
# Uncomment the ENV line below and set your token if you prefer.
|
| 17 |
+
# ENV HUGGING_FACE_HUB_TOKEN="<YOUR_HUGGINGFACE_TOKEN>"
|
| 18 |
|
| 19 |
# Command to run the vLLM OpenAI-compatible server with your model
|
| 20 |
# Replace "your-model-name" with the actual model ID from Hugging Face
|
| 21 |
+
CMD ["python", "-m", "vllm.entrypoints.openai.api_server", "--model", "unsloth/Llama-3.2-3B-bnb-4bit", "--host", "0.0.0.0", "--port", "7860"]
|