riazmo committed on
Commit
8fc9c81
·
verified ·
1 Parent(s): 4abbd8b

Upload settings.py

Browse files
Files changed (1) hide show
  1. config/settings.py +13 -4
config/settings.py CHANGED
@@ -42,15 +42,16 @@ class ModelSettings:
42
  agent2_model: str = field(default_factory=lambda: os.getenv("AGENT2_MODEL", "microsoft/Phi-3.5-mini-instruct"))
43
 
44
  # Agent 3 (Advisor): Strong reasoning - MOST IMPORTANT
45
- # Default: Meta Llama 70B (excellent reasoning)
46
- agent3_model: str = field(default_factory=lambda: os.getenv("AGENT3_MODEL", "meta-llama/Llama-3.1-70B-Instruct"))
 
47
 
48
  # Agent 4 (Generator): Code/JSON specialist
49
  # Default: Mistral Codestral (code specialist)
50
  agent4_model: str = field(default_factory=lambda: os.getenv("AGENT4_MODEL", "mistralai/Codestral-22B-v0.1"))
51
 
52
- # Fallback
53
- fallback_model: str = field(default_factory=lambda: os.getenv("FALLBACK_MODEL", "mistralai/Mistral-7B-Instruct-v0.3"))
54
 
55
 
56
  @dataclass
@@ -161,9 +162,17 @@ class Settings:
161
  def get_model_for_agent(self, agent_name: str) -> str:
162
  """Get the model ID for a specific agent."""
163
  model_map = {
 
164
  "normalizer": self.models.agent2_model,
165
  "advisor": self.models.agent3_model,
166
  "generator": self.models.agent4_model,
 
 
 
 
 
 
 
167
  }
168
  return model_map.get(agent_name, self.models.fallback_model)
169
 
 
42
  agent2_model: str = field(default_factory=lambda: os.getenv("AGENT2_MODEL", "microsoft/Phi-3.5-mini-instruct"))
43
 
44
  # Agent 3 (Advisor): Strong reasoning - MOST IMPORTANT
45
+ # Default: Qwen 2.5 72B (freely available on HF serverless, no gated access needed)
46
+ # Alternative: meta-llama/Llama-3.1-70B-Instruct (requires Meta license acceptance)
47
+ agent3_model: str = field(default_factory=lambda: os.getenv("AGENT3_MODEL", "Qwen/Qwen2.5-72B-Instruct"))
48
 
49
  # Agent 4 (Generator): Code/JSON specialist
50
  # Default: Mistral Codestral (code specialist)
51
  agent4_model: str = field(default_factory=lambda: os.getenv("AGENT4_MODEL", "mistralai/Codestral-22B-v0.1"))
52
 
53
+ # Fallback (must be freely available on HF serverless inference)
54
+ fallback_model: str = field(default_factory=lambda: os.getenv("FALLBACK_MODEL", "Qwen/Qwen2.5-7B-Instruct"))
55
 
56
 
57
  @dataclass
 
162
  def get_model_for_agent(self, agent_name: str) -> str:
163
  """Get the model ID for a specific agent."""
164
  model_map = {
165
+ # Legacy agents
166
  "normalizer": self.models.agent2_model,
167
  "advisor": self.models.agent3_model,
168
  "generator": self.models.agent4_model,
169
+
170
+ # Stage 2 New Architecture agents
171
+ "brand_identifier": self.models.agent3_model, # Advisor model (default: Qwen 2.5 72B) - needs context understanding
172
+ "benchmark_advisor": self.models.agent3_model, # Advisor model (default: Qwen 2.5 72B) - needs reasoning
173
+ "best_practices_validator": self.models.agent3_model, # Advisor model (default: Qwen 2.5 72B) - needs judgment
174
+ "head_synthesizer": self.models.agent3_model, # Advisor model (default: Qwen 2.5 72B) - needs synthesis
175
+ "benchmark_extractor": self.models.agent2_model, # Phi-3.5 - structured extraction
176
  }
177
  return model_map.get(agent_name, self.models.fallback_model)
178