Spaces:
Sleeping
Sleeping
Upload Dockerfile
Browse files- Dockerfile +1 -1
Dockerfile
CHANGED
|
@@ -36,4 +36,4 @@ EXPOSE 7860
|
|
| 36 |
ENTRYPOINT []
|
| 37 |
|
| 38 |
# Set the CMD to launch the vLLM server (for your new model) in the background and then start the Gradio app.
|
| 39 |
-
CMD ["bash", "-c", "vllm.entrypoints.openai.api_server --model unsloth/llama-3-8b-Instruct-bnb-4bit --enable-auto-tool-choice --tool-call-parser llama3_json --chat-template examples/tool_chat_template_llama3.1_json.jinja --quantization bitsandbytes --load-format bitsandbytes --dtype half --max-model-len 8192
|
|
|
|
| 36 |
# Reset the entrypoint to empty so the CMD below is executed exactly as written
# instead of being appended as arguments to an inherited ENTRYPOINT.
# NOTE(review): presumably the base image defines its own entrypoint; confirm against the FROM line.
ENTRYPOINT []
|
| 37 |
|
| 38 |
# Set the CMD to launch the vLLM server (for your new model) in the background and then start the Gradio app.
|
| 39 |
+
# `python3 -m` runs the vLLM OpenAI-compatible API server module; the trailing `&`
# puts it in the background so the shell can go on to start app.py.
# `exec` replaces the bash wrapper with the app process so it receives the
# container's stop signal directly.
# NOTE(review): nothing here waits for the vLLM server to become ready; confirm app.py retries its first requests.
CMD ["bash", "-c", "python3 -m vllm.entrypoints.openai.api_server --model unsloth/llama-3-8b-Instruct-bnb-4bit --enable-auto-tool-choice --tool-call-parser llama3_json --chat-template examples/tool_chat_template_llama3.1_json.jinja --quantization bitsandbytes --load-format bitsandbytes --dtype half --max-model-len 8192 & exec python3 app.py"]
|