batmanLovesAI's picture
how much more fix
547ddc8
Raw
History Blame Contribute Delete
220 Bytes
#!/bin/sh
#
# Launcher for the Ollama server.
#
# Sets the server's configuration through environment variables and then
# hands the process over to `ollama serve`. The values are assigned
# unconditionally, so anything already present in the environment for
# these four names is overwritten.

# Address and port handed to the server (0.0.0.0 = every interface).
OLLAMA_HOST=0.0.0.0:7860

# Process a single request at a time.
OLLAMA_NUM_PARALLEL=1

# Cap the request queue at 128 entries (a reduced queue size).
OLLAMA_MAX_QUEUE=128

# Keep a model alive for one hour.
OLLAMA_KEEP_ALIVE=1h

# Publish all four settings to the child process in one statement.
export OLLAMA_HOST OLLAMA_NUM_PARALLEL OLLAMA_MAX_QUEUE OLLAMA_KEEP_ALIVE

# exec replaces this shell with the server, so no wrapper process stays
# behind and signals reach ollama directly.
exec ollama serve