Spaces:
Paused
Paused
File size: 1,424 Bytes
fb867c3
{
"servers": [
{
"name": "creative",
"url": "http://localhost:1234/v1",
"model": "mistral-7b-instruct",
"timeout": 120.0,
"max_concurrent": 4,
"weight": 1.0,
"enabled": true,
"description": "Fast, creative model for research tasks"
},
{
"name": "analytical",
"url": "http://localhost:1235/v1",
"model": "llama-3.1-8b-instruct",
"timeout": 120.0,
"max_concurrent": 4,
"weight": 1.0,
"enabled": true,
"description": "Balanced model for analysis and critique"
},
{
"name": "synthesis",
"url": "http://localhost:1236/v1",
"model": "mixtral-8x7b-instruct",
"timeout": 180.0,
"max_concurrent": 2,
"weight": 1.5,
"enabled": true,
"description": "High-quality model for synthesis and final output"
},
{
"name": "fallback",
"url": "http://localhost:1237/v1",
"model": "phi-3-mini-instruct",
"timeout": 60.0,
"max_concurrent": 8,
"weight": 0.5,
"enabled": false,
"description": "Fast fallback model for high-load scenarios"
}
],
"agent_mapping": {
"research": "creative",
"analysis": "analytical",
"synthesis": "synthesis",
"critic": "analytical"
},
"load_balance_strategy": "agent_type_mapping",
"health_check_interval": 30.0,
"failover_enabled": true,
"debug_mode": false
}