# Spaces: Running (Running) - File size: 1,057 Bytes
# Compose stack with three services: a llama.cpp model server (`llama`), an
# HTTP API that is handed the model server's URL (`app`), and a Streamlit
# front end that is handed the API's URL (`demo`).
services:
  # Model server. Loads the GGUF checkpoint mounted read-only at
  # /models/model.gguf and listens on port 9000 on all interfaces. The port is
  # not published to the host; other services reach it as http://llama:9000.
  llama:
    image: ghcr.io/ggml-org/llama.cpp:server
    volumes:
      - ./finetune/models/qwen-base-run/ckpt-001.gguf:/models/model.gguf:ro
    # Folded scalar with strip chomping (`>-`): the lines below are joined
    # with spaces into one argument string with no trailing newline.
    command: >-
      -m /models/model.gguf
      --port 9000
      --host 0.0.0.0
      --ctx-size 2048
      -t 4
    # Marks the container healthy once GET /health succeeds. With a 30s start
    # period plus 30 retries at 10s intervals, the model gets roughly five
    # minutes to load before the container is reported unhealthy.
    # NOTE(review): assumes `curl` is present in the image - confirm.
    healthcheck:
      test: ["CMD", "curl", "-f", "http://localhost:9000/health"]
      interval: 10s
      timeout: 5s
      retries: 30
      start_period: 30s

  # API service. Built from Dockerfile.compose, reads ./data mounted read-only
  # at /data, and is published on host port 8000.
  app:
    build:
      context: .
      dockerfile: Dockerfile.compose
    volumes:
      - ./data:/data:ro
    environment:
      GAZET_DATA_DIR: /data
      LLAMA_SERVER_URL: http://llama:9000
    ports:
      - "8000:8000"
    command: uvicorn gazet.api:app --host 0.0.0.0 --port 8000
    # Start only after the llama healthcheck reports healthy.
    depends_on:
      llama:
        condition: service_healthy

  # Streamlit demo. Built from the same Dockerfile.compose as `app` and
  # published on host port 8501.
  demo:
    build:
      context: .
      dockerfile: Dockerfile.compose
    environment:
      GAZET_API_URL: http://app:8000
    ports:
      - "8501:8501"
    command: streamlit run gazet_demo.py --server.port 8501 --server.address 0.0.0.0
    # Short-form dependency: orders start-up after `app` but does not wait for
    # the API to be ready, because `app` defines no healthcheck.
    depends_on:
      - app