LLM-api-speedtest / Dockerfile
krupakar-reddy's picture
Update Dockerfile
1a11952 verified
raw
history blame contribute delete
331 Bytes
# Image that serves `main:app` with uvicorn on port 7860 and bundles a local
# GGUF model file next to the application code.
#
# NOTE(review): the full python:3.9 image is kept instead of a -slim variant
# because requirements.txt is not visible here and may contain packages that
# need a compiler toolchain at install time — confirm before slimming.
FROM python:3.9

# Create an unprivileged account so the server does not run as root.
# UID 1000 is the value the Hugging Face Spaces Docker guide recommends; a
# fixed numeric UID also lets orchestrators verify a non-root user.
# /code is created and handed to that account here so the app can still write
# next to its sources (e.g. __pycache__) after the USER switch below.
RUN useradd --create-home --uid 1000 appuser \
    && mkdir -p /code \
    && chown appuser:appuser /code

WORKDIR /code

# Dependency manifest is copied on its own so the install layer below stays
# cached until requirements.txt itself changes.
COPY ./requirements.txt /code/requirements.txt

# Installed system-wide while still root; --no-cache-dir keeps pip's download
# cache out of the image layer.
RUN pip install --no-cache-dir --upgrade -r /code/requirements.txt

# The model file is copied before main.py so that editing the application
# source does not invalidate this (large) layer.
COPY --chown=appuser:appuser ./meta-llama-3-8b-instruct.Q4_K_M.gguf /code/meta-llama-3-8b-instruct.Q4_K_M.gguf
COPY --chown=appuser:appuser ./main.py /code/main.py

# Drop privileges only after every step that needs root has run.
USER appuser

# Documentation only: the port uvicorn binds in CMD below.
EXPOSE 7860

# Exec (JSON-array) form, so uvicorn is started directly rather than via a shell.
CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]