# Use a small Python base image
FROM python:3.11-slim

# Create an unprivileged account for running the service and hand it the
# application directory, so the container does not run as root and the app
# can still write inside /app. The fixed UID lets runtimes that check for a
# non-root numeric UID verify it.
RUN useradd --create-home --uid 1000 appuser \
    && mkdir -p /app \
    && chown appuser:appuser /app

# All following relative paths resolve against /app
WORKDIR /app

# Copy only the dependency manifest first: the install layer below is then
# reused from cache until requirements.txt itself changes
COPY requirements.txt .

# Install the Python dependencies listed in requirements.txt. This runs as
# root so packages land in the system site-packages; --no-cache-dir keeps
# pip's download cache out of the image layer.
RUN pip install --no-cache-dir -r requirements.txt

# Copy the rest of the build context, owned by the runtime user.
# NOTE(review): make sure a .dockerignore excludes .git, .env and similar
# files so they are not baked into the image.
COPY --chown=appuser:appuser . .

# Default model name passed to the app through the environment.
# Override it at run time, e.g. `docker run -e MODEL_NAME=<name> ...`
ENV MODEL_NAME=llama-3-70b

# Document the port the server listens on (EXPOSE does not publish it)
EXPOSE 7860

# Drop root privileges for everything that runs in the container
USER appuser

# Start the app: exec form, so uvicorn is PID 1 and receives stop signals
CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]