Spaces:
Sleeping
Sleeping
Upload settings.py
Browse files- config/settings.py +13 -4
config/settings.py
CHANGED
|
@@ -42,15 +42,16 @@ class ModelSettings:
|
|
| 42 |
agent2_model: str = field(default_factory=lambda: os.getenv("AGENT2_MODEL", "microsoft/Phi-3.5-mini-instruct"))
|
| 43 |
|
| 44 |
# Agent 3 (Advisor): Strong reasoning - MOST IMPORTANT
|
| 45 |
-
# Default:
|
| 46 |
-
|
|
|
|
| 47 |
|
| 48 |
# Agent 4 (Generator): Code/JSON specialist
|
| 49 |
# Default: Mistral Codestral (code specialist)
|
| 50 |
agent4_model: str = field(default_factory=lambda: os.getenv("AGENT4_MODEL", "mistralai/Codestral-22B-v0.1"))
|
| 51 |
|
| 52 |
-
# Fallback
|
| 53 |
-
fallback_model: str = field(default_factory=lambda: os.getenv("FALLBACK_MODEL", "
|
| 54 |
|
| 55 |
|
| 56 |
@dataclass
|
|
@@ -161,9 +162,17 @@ class Settings:
|
|
| 161 |
def get_model_for_agent(self, agent_name: str) -> str:
|
| 162 |
"""Get the model ID for a specific agent."""
|
| 163 |
model_map = {
|
|
|
|
| 164 |
"normalizer": self.models.agent2_model,
|
| 165 |
"advisor": self.models.agent3_model,
|
| 166 |
"generator": self.models.agent4_model,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 167 |
}
|
| 168 |
return model_map.get(agent_name, self.models.fallback_model)
|
| 169 |
|
|
|
|
| 42 |
agent2_model: str = field(default_factory=lambda: os.getenv("AGENT2_MODEL", "microsoft/Phi-3.5-mini-instruct"))
|
| 43 |
|
| 44 |
# Agent 3 (Advisor): Strong reasoning - MOST IMPORTANT
|
| 45 |
+
# Default: Qwen 2.5 72B (freely available on HF serverless, no gated access needed)
|
| 46 |
+
# Alternative: meta-llama/Llama-3.1-70B-Instruct (requires Meta license acceptance)
|
| 47 |
+
agent3_model: str = field(default_factory=lambda: os.getenv("AGENT3_MODEL", "Qwen/Qwen2.5-72B-Instruct"))
|
| 48 |
|
| 49 |
# Agent 4 (Generator): Code/JSON specialist
|
| 50 |
# Default: Mistral Codestral (code specialist)
|
| 51 |
agent4_model: str = field(default_factory=lambda: os.getenv("AGENT4_MODEL", "mistralai/Codestral-22B-v0.1"))
|
| 52 |
|
| 53 |
+
# Fallback (must be freely available on HF serverless inference)
|
| 54 |
+
fallback_model: str = field(default_factory=lambda: os.getenv("FALLBACK_MODEL", "Qwen/Qwen2.5-7B-Instruct"))
|
| 55 |
|
| 56 |
|
| 57 |
@dataclass
|
|
|
|
| 162 |
def get_model_for_agent(self, agent_name: str) -> str:
|
| 163 |
"""Get the model ID for a specific agent."""
|
| 164 |
model_map = {
|
| 165 |
+
# Legacy agents
|
| 166 |
"normalizer": self.models.agent2_model,
|
| 167 |
"advisor": self.models.agent3_model,
|
| 168 |
"generator": self.models.agent4_model,
|
| 169 |
+
|
| 170 |
+
# Stage 2 New Architecture agents
|
| 171 |
+
"brand_identifier": self.models.agent3_model, # Agent 3 model (default: Qwen 2.5 72B) - needs context understanding
|
| 172 |
+
"benchmark_advisor": self.models.agent3_model, # Agent 3 model (default: Qwen 2.5 72B) - needs reasoning
|
| 173 |
+
"best_practices_validator": self.models.agent3_model, # Agent 3 model (default: Qwen 2.5 72B) - needs judgment
|
| 174 |
+
"head_synthesizer": self.models.agent3_model, # Agent 3 model (default: Qwen 2.5 72B) - needs synthesis
|
| 175 |
+
"benchmark_extractor": self.models.agent2_model, # Phi-3.5 - structured extraction
|
| 176 |
}
|
| 177 |
return model_map.get(agent_name, self.models.fallback_model)
|
| 178 |
|