File size: 1,424 Bytes
fb867c3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
{
  "servers": [
    {
      "name": "creative",
      "url": "http://localhost:1234/v1",
      "model": "mistral-7b-instruct",
      "timeout": 120.0,
      "max_concurrent": 4,
      "weight": 1.0,
      "enabled": true,
      "description": "Fast, creative model for research tasks"
    },
    {
      "name": "analytical",
      "url": "http://localhost:1235/v1",
      "model": "llama-3.1-8b-instruct",
      "timeout": 120.0,
      "max_concurrent": 4,
      "weight": 1.0,
      "enabled": true,
      "description": "Balanced model for analysis and critique"
    },
    {
      "name": "synthesis",
      "url": "http://localhost:1236/v1",
      "model": "mixtral-8x7b-instruct",
      "timeout": 180.0,
      "max_concurrent": 2,
      "weight": 1.5,
      "enabled": true,
      "description": "High-quality model for synthesis and final output"
    },
    {
      "name": "fallback",
      "url": "http://localhost:1237/v1",
      "model": "phi-3-mini-instruct",
      "timeout": 60.0,
      "max_concurrent": 8,
      "weight": 0.5,
      "enabled": false,
      "description": "Fast fallback model for high-load scenarios"
    }
  ],
  "agent_mapping": {
    "research": "creative",
    "analysis": "analytical",
    "synthesis": "synthesis",
    "critic": "analytical"
  },
  "load_balance_strategy": "agent_type_mapping",
  "health_check_interval": 30.0,
  "failover_enabled": true,
  "debug_mode": false
}