Spaces:

robell05
/

GptForChess

Sleeping

GptForChess / Dockerfile

serving model

6d75857 18 days ago

1.23 kB

	FROM python:3.12.2-slim

	ENV PYTHONDONTWRITEBYTECODE=1 \
	PYTHONUNBUFFERED=1 \
	PIP_NO_CACHE_DIR=1

	# build-essential covers the few deps with C extensions (numpy/pandas wheels
	# are usually prebuilt for 3.12, but this is cheap insurance).
	RUN apt-get update && apt-get install -y --no-install-recommends \
	build-essential \
	&& rm -rf /var/lib/apt/lists/*

	WORKDIR /app

	# Deps first so editing app.py doesn't reinstall torch on every rebuild.
	COPY requirements.txt .
	RUN pip install --extra-index-url https://download.pytorch.org/whl/cpu -r requirements.txt

	# Source next.
	COPY src/ ./src/
	COPY app.py ./

	# Weights last — biggest layer, changes least often, so cache stays warm
	# when you iterate on app.py.
	COPY model/ ./model/

	# torch.load on tokenizer.pt unpickles a `Tokenizer` instance that was
	# saved from the module path `tokenizer` (src/tokenizer.py). Making /app/src
	# importable lets the unpickler find that class.
	ENV PYTHONPATH=/app/src

	# HF Spaces routes external traffic to $PORT; 7860 is the convention.
	# Single worker — the model lives in process memory and multiple workers
	# would multiply the ~1.5 GB RSS.
	EXPOSE 7860
	CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860", "--workers", "1"]