# Phantom Grid environment settings.
# Format: one KEY=VALUE assignment per line; lines starting with '#' are comments.
# Keep comments on their own lines: many env/INI parsers treat text after the
# value as part of the value.

# === Default backend: plain text llama.cpp server (no audio) ===
# OpenBMB MiniCPM4.1-8B (text-only). Chosen as the default because it stays in
# English reliably, unlike the MiniCPM-o omni model.
PHANTOM_GRID_LLM_PROVIDER=llama_cpp_server
PHANTOM_GRID_LLM_MODEL=MiniCPM4.1-8B-Q4_K_M.gguf
PHANTOM_GRID_LLAMACPP_MODEL_PATH=runtime/models/MiniCPM4.1-8B-gguf/MiniCPM4.1-8B-Q4_K_M.gguf

# Reuse the llama-server built for the omni stack (it also serves plain text GGUFs),
# or any standalone llama.cpp build / installed llama-server.
PHANTOM_GRID_LLAMACPP_SERVER_BIN=runtime/llama.cpp-omni/build/bin/Release/llama-server.exe
PHANTOM_GRID_LLAMACPP_BASE_URL=http://127.0.0.1:8080/v1
PHANTOM_GRID_LLAMACPP_CONTEXT_LENGTH=8192
PHANTOM_GRID_LLAMACPP_GPU_LAYERS=auto
PHANTOM_GRID_GPU_DEVICE=auto

# Text backend has no voice; keep TTS off.
PHANTOM_GRID_WITNESS_CHAT_TTS=0

# === Optional: MiniCPM-o omni voice mode ===
# WARNING: The MiniCPM-o omni model frequently hallucinates and drifts into
# Chinese (especially its TTS/audio branch), even on English-only prompts. Use
# it only if you need synthesized witness voices, and expect occasional Chinese
# output. To enable, set PHANTOM_GRID_LLM_PROVIDER=minicpm_omni and
# PHANTOM_GRID_WITNESS_CHAT_TTS=1.
PHANTOM_GRID_OMNI_GATEWAY_URL=http://127.0.0.1:8006
PHANTOM_GRID_OMNI_LAUNCHER_PATH=scripts/launch_minicpm_omni.py
PHANTOM_GRID_COMNI_CHECKOUT_PATH=runtime/MiniCPM-o-Demo
PHANTOM_GRID_LLAMACPP_OMNI_ROOT=runtime/llama.cpp-omni
PHANTOM_GRID_MINICPM_MODEL_DIR=runtime/models/MiniCPM-o-4_5-gguf
PHANTOM_GRID_MINICPM_QUANTIZATION=MiniCPM-o-4_5-Q4_K_M.gguf

# === Gameplay ===
# NOTE(review): this is the only path in the file written with a backslash;
# every other path uses forward slashes. Confirm the loader handles it as
# intended on non-Windows hosts before changing it.
PHANTOM_GRID_WITNESS_VOICE_DIR=data\voices
PHANTOM_GRID_MAX_TURNS=12
PHANTOM_GRID_CHECKS_PER_TURN=2
PHANTOM_GRID_BLOCKS_PER_TURN=1
PHANTOM_GRID_INDIVIDUAL_WITNESS_THRESHOLD=12
PHANTOM_GRID_MEMORY_CORRUPTION_PER_TURN=0.08