Spaces:

Distopia22
/

medical-coding-api

Sleeping

Fix: Add robust model loading with safetensors fallback strategies

61e7d9a 8 months ago

1.36 kB

	FROM python:3.10-slim

	WORKDIR /app

	ENV PYTHONUNBUFFERED=1 \
	PYTHONDONTWRITEBYTECODE=1 \
	PIP_NO_CACHE_DIR=1 \
	TRANSFORMERS_CACHE=/app/.cache/transformers \
	HF_HOME=/app/.cache/huggingface \
	HF_HUB_ENABLE_HF_TRANSFER=1

	# Install system dependencies
	RUN apt-get update && apt-get install -y --no-install-recommends \
	git \
	git-lfs \
	build-essential \
	curl \
	ca-certificates \
	wget \
	&& git lfs install \
	&& rm -rf /var/lib/apt/lists/* \
	&& apt-get clean

	# Upgrade pip
	RUN pip install --no-cache-dir --upgrade pip==24.2

	# Install hf_transfer for faster downloads (optional but helps)
	RUN pip install --no-cache-dir hf-transfer==0.1.8

	# Copy and install requirements
	COPY requirements.txt .
	RUN pip install --no-cache-dir -r requirements.txt

	# Copy application
	COPY app/ ./app/

	# Create directories with proper permissions
	RUN mkdir -p /app/offload /app/.cache/transformers /app/.cache/huggingface && \
	chmod -R 777 /app/offload /app/.cache

	EXPOSE 7860

	# Longer startup period for model download
	HEALTHCHECK --interval=30s --timeout=30s --start-period=600s --retries=5 \
	CMD curl -f http://localhost:7860/health \|\| exit 1

	CMD ["uvicorn", "app.api:app", \
	"--host", "0.0.0.0", \
	"--port", "7860", \
	"--timeout-keep-alive", "300", \
	"--workers", "1", \
	"--log-level", "info"]