| name: kokoro-fastapi-cpu | |
| services: | |
| kokoro-tts: | |
| build: | |
| context: ../.. | |
| dockerfile: docker/cpu/Dockerfile | |
| volumes: | |
| - ../../api:/app/api | |
| ports: | |
| - "8880:8880" | |
| environment: | |
| - PYTHONPATH=/app:/app/api | |
| # ONNX Optimization Settings for vectorized operations | |
| - ONNX_NUM_THREADS=8 # Maximize core usage for vectorized ops | |
| - ONNX_INTER_OP_THREADS=4 # Higher inter-op for parallel matrix operations | |
| - ONNX_EXECUTION_MODE=parallel | |
| - ONNX_OPTIMIZATION_LEVEL=all | |
| - ONNX_MEMORY_PATTERN=true | |
| - ONNX_ARENA_EXTEND_STRATEGY=kNextPowerOfTwo | |
| # # Gradio UI service [Comment out everything below if you don't need it] | |
| # gradio-ui: | |
| # image: ghcr.io/remsky/kokoro-fastapi-ui:v0.2.0 | |
| # # Uncomment below (and comment out above) to build from source instead of using the released image | |
| # build: | |
| # context: ../../ui | |
| # ports: | |
| # - "7860:7860" | |
| # volumes: | |
| # - ../../ui/data:/app/ui/data | |
| # - ../../ui/app.py:/app/app.py # Mount app.py for hot reload | |
| # environment: | |
| # - GRADIO_WATCH=True # Enable hot reloading | |
| # - PYTHONUNBUFFERED=1 # Ensure Python output is not buffered | |
| # - DISABLE_LOCAL_SAVING=false # Set to 'true' to disable local saving and hide file view | |
| # - API_HOST=kokoro-tts # Set TTS service URL | |
| # - API_PORT=8880 # Set TTS service PORT |