#!/bin/sh
# Entrypoint: configure and launch the Ollama server.
#
# Every setting below is exported so that the `ollama serve` process started
# at the end of this script inherits it through its environment.
#
# NOTE: each statement must stay on its own line. Anything that follows the
# interpreter path on the `#!` line is not executed as shell code.

# Abort on a failed command or on use of an unset variable.
set -eu

# Address and port the server binds to: all interfaces, port 7860.
export OLLAMA_HOST=0.0.0.0:7860

# One request at a time.
export OLLAMA_NUM_PARALLEL=1

# Smaller queue: allow at most 128 requests to wait.
export OLLAMA_MAX_QUEUE=128

# Keep model alive for 1 hour.
export OLLAMA_KEEP_ALIVE=1h

# Replace this shell with the server process instead of running it as a
# child, so the server keeps this script's PID and receives signals directly.
exec ollama serve