# Rafs-an09002's picture
# Create Dockerfile
# c970b1d verified
# raw
# history blame
# 842 Bytes
# Nexus-Nano Inference - Ultra Lightweight
# Minimal footprint for maximum speed
FROM python:3.10-slim

# curl is only needed by the HEALTHCHECK probe below. Skip recommended
# packages and drop the apt lists in the same layer to keep the image small.
RUN apt-get update \
    && apt-get install -y --no-install-recommends curl \
    && rm -rf /var/lib/apt/lists/*

# Create an unprivileged account and hand it the (still empty) application
# tree, so the chown is cheap and nothing in the final image has to run as
# root. UID 1000 is the UID Hugging Face Spaces uses for Docker containers
# (NOTE(review): port 7860 suggests a Space - confirm the deployment target).
RUN useradd --create-home --uid 1000 app \
    && mkdir -p /app/models \
    && chown -R app:app /app

WORKDIR /app

# Install Python dependencies before any application code so this layer is
# rebuilt only when requirements.txt changes. Done as root so the packages
# land in the system site-packages.
COPY requirements.txt .
RUN pip install --no-cache-dir -r requirements.txt

# Everything from here on (model download, app code, runtime) is unprivileged.
USER app

# Download the Nexus-Nano model into /app/models and fail the build right
# away if the expected file is missing. This happens before app.py is copied
# so editing the app does not trigger a fresh download.
# NOTE(review): local_dir_use_symlinks is deprecated in recent huggingface_hub
# releases - confirm against the version pinned in requirements.txt.
RUN python -c "from huggingface_hub import hf_hub_download; \
hf_hub_download( \
repo_id='GambitFlow/Nexus-Nano', \
filename='nexus_nano.onnx', \
local_dir='/app/models', \
local_dir_use_symlinks=False \
)" \
    && ls -lh /app/models/nexus_nano.onnx

# Application code goes last: it is the most frequently changing input.
COPY --chown=app:app app.py .

# Port the health check probes; EXPOSE is documentation only.
EXPOSE 7860

# PYTHONUNBUFFERED=1 turns off stdout/stderr buffering so logs show up
# immediately; OMP_NUM_THREADS=2 limits OpenMP-based libraries to two threads.
ENV PYTHONUNBUFFERED=1 \
    OMP_NUM_THREADS=2

# Mark the container unhealthy when /health stops answering successfully.
# -f fails on HTTP errors, -sS hides the progress meter but keeps error text.
HEALTHCHECK --interval=30s --timeout=10s --start-period=5s --retries=3 \
    CMD curl -fsS http://localhost:7860/health || exit 1

# Exec form so the Python process is PID 1 and receives stop signals directly.
CMD ["python", "app.py"]