Final_Assignment_Template

Sleeping

App Files Community

Kackle committed on Jun 27, 2025

Commit

b652747

verified ·

1 Parent(s): 8117b77

too many tokens used, reducing complexity

Browse files

Files changed (1) hide show

app.py +34 -94

app.py CHANGED Viewed

@@ -105,85 +105,48 @@ class SlpMultiAgent:
         MAX_QUESTION_LENGTH = 1000
         short_question = question  # [:MAX_QUESTION_LENGTH]
-        # Use GPT-3.5-turbo model with optimized settings
         model = OpenAIServerModel(
-            model_id="gpt-3.5-turbo-16k",
-            temperature=0.1,  # Slight randomness for better reasoning
-            max_tokens=1000    # Keep higher tokens for complex reasoning
         )
-        # Create specialized agents for complex problem-solving
         research_agent = CodeAgent(
-            tools=[KnowledgeBaseTool()],
             model=model,
-            additional_authorized_imports=["pandas", "time", "json", "requests", "re", "datetime"],
-            max_steps=4,
             name="ResearchAgent",
             verbosity_level=0,
-            description="Specializes in factual research, historical data, and knowledge retrieval."
         )
-        math_agent = CodeAgent(
             tools=[],
             model=model,
-            additional_authorized_imports=["math", "statistics", "numpy", "pandas", "fractions", "decimal"],
-            max_steps=4,
-            name="MathAgent",
             verbosity_level=0,
-            description="Specializes in mathematical calculations, statistics, and numerical analysis."
-        )
-        logic_agent = CodeAgent(
-            tools=[],
-            model=model,
-            additional_authorized_imports=["itertools", "collections", "re", "string"],
-            max_steps=4,
-            name="LogicAgent",
-            verbosity_level=0,
-            description="Specializes in logical reasoning, pattern recognition, and problem decomposition."
-        )
-        language_agent = CodeAgent(
-            tools=[],
-            model=model,
-            additional_authorized_imports=["re", "string", "collections"],
-            max_steps=3,
-            name="LanguageAgent",
-            verbosity_level=0,
-            description="Specializes in text analysis, word puzzles, linguistics, and language patterns."
-        )
-        data_agent = CodeAgent(
-            tools=[],
-            model=model,
-            additional_authorized_imports=["pandas", "json", "csv", "collections", "statistics"],
-            max_steps=4,
-            name="DataAgent",
-            verbosity_level=0,
-            description="Specializes in data processing, sorting, filtering, and structured analysis."
         )
         manager_agent = CodeAgent(
             model=OpenAIServerModel(
-                model_id="gpt-3.5-turbo-16k",
-                temperature=0.2,  # Slightly higher for better reasoning variety
-                max_tokens=1200
             ),
-            tools=[KnowledgeBaseTool()],
-            managed_agents=[research_agent, math_agent, logic_agent, language_agent, data_agent],
             name="ManagerAgent",
-            description="A manager agent that coordinates research and analysis agents to solve complex questions.",
-            additional_authorized_imports=[
-                "pandas",
-                "time",
-                "json",
-                "requests",
-                "re",
-                "math"
-            ],
-            planning_interval=2,
-            verbosity_level=1,
-            max_steps=10,  # More steps for complex coordination
             final_answer_checks=[check_reasoning]
         )
@@ -199,22 +162,15 @@ class SlpMultiAgent:
                     lambda: manager_agent.run(f"""
                     Question: {short_question}
-                    You have 5 specialized agents available:
-                    - ResearchAgent: Facts, history, knowledge lookup
-                    - MathAgent: Calculations, statistics, numerical problems
-                    - LogicAgent: Logical reasoning, patterns, problem decomposition
-                    - LanguageAgent: Text analysis, word puzzles, linguistics
-                    - DataAgent: Data processing, sorting, structured analysis
-                    Strategy:
-                    1. Analyze question type and complexity
-                    2. Use knowledge_base() for context
-                    3. Delegate to most appropriate specialist agent(s)
-                    4. Synthesize results into final answer
-                    CRITICAL: End with <code>final_answer("exact answer")</code>
-                    Final answer must be direct and specific - no explanations.
                     """)
                 )
                 break  # Success, exit retry loop
@@ -256,24 +212,8 @@ class SlpMultiAgent:
         return result if result else "Unable to determine answer."
 def check_reasoning(final_answer, agent_memory):
-    try:
-        # Simple validation - check if answer looks complete
-        if not final_answer or len(final_answer.strip()) < 1:
-            return False
-        # Check if it's just thoughts/reasoning instead of an answer
-        bad_patterns = ['### Thought:', '### Code:', 'I will', 'Let me', 'First, I', 'Next, I', 'Step 1:', 'Based on']
-        if any(pattern in final_answer for pattern in bad_patterns):
-            return False
-        # Check if answer is too long (likely contains reasoning)
-        if len(final_answer) > 300:
-            return False
-        return True  # Pass if it looks like a real answer
-    except Exception as e:
-        print(f"Error in reasoning check: {e}")
-        return True  # Default to passing on errors
 async def run_and_submit_all(profile):
@@ -337,8 +277,8 @@ async def run_and_submit_all(profile):
     answers_payload = []
     print(f"Running agent on {len(questions_data)} questions...")
-    # Process questions with optimized concurrency
-    semaphore = asyncio.Semaphore(2)  # Process 2 questions at a time for better efficiency
     async def process_question(item):
         task_id = item.get("task_id")

         MAX_QUESTION_LENGTH = 1000
         short_question = question  # [:MAX_QUESTION_LENGTH]
+        # Use cheaper, faster model
         model = OpenAIServerModel(
+            model_id="gpt-3.5-turbo",
+            temperature=0.0,  # Deterministic for consistency
+            max_tokens=400    # Reduced tokens for cost efficiency
         )
+        # Create only essential agents with reduced complexity
         research_agent = CodeAgent(
+            tools=[KnowledgeBaseTool()],  # Remove search to avoid timeouts
             model=model,
+            additional_authorized_imports=["re", "datetime"],
+            max_steps=2,  # Reduced steps for cost
             name="ResearchAgent",
             verbosity_level=0,
+            description="Quick factual research and knowledge lookup."
         )
+        solver_agent = CodeAgent(
             tools=[],
             model=model,
+            additional_authorized_imports=["math", "re", "collections", "itertools"],
+            max_steps=2,  # Reduced steps
+            name="SolverAgent",
             verbosity_level=0,
+            description="Problem solving, calculations, and logical reasoning."
         )
         manager_agent = CodeAgent(
             model=OpenAIServerModel(
+                model_id="gpt-3.5-turbo",
+                temperature=0.0,
+                max_tokens=500
             ),
+            tools=[KnowledgeBaseTool()],  # Only knowledge base
+            managed_agents=[research_agent, solver_agent],  # Only 2 agents
             name="ManagerAgent",
+            description="Efficient manager for quick problem solving.",
+            additional_authorized_imports=["re", "math"],
+            planning_interval=1,  # Faster planning
+            verbosity_level=0,  # Reduce verbosity
+            max_steps=4,  # Drastically reduced steps
             final_answer_checks=[check_reasoning]
         )
                     lambda: manager_agent.run(f"""
                     Question: {short_question}
+                    You have ResearchAgent and SolverAgent. Be efficient:
+                    For factual questions: Use ResearchAgent
+                    For calculations/logic: Use SolverAgent
+                    For simple questions: Answer directly using knowledge_base()
+                    CRITICAL: Always end with <code>final_answer("answer")</code>
+                    Be fast and direct - no lengthy reasoning.
                     """)
                 )
                 break  # Success, exit retry loop
         return result if result else "Unable to determine answer."
 def check_reasoning(final_answer, agent_memory):
+    # Skip expensive validation to save costs
+    return True
 async def run_and_submit_all(profile):
     answers_payload = []
     print(f"Running agent on {len(questions_data)} questions...")
+    # Process questions one at a time to avoid rate limits
+    semaphore = asyncio.Semaphore(1)  # Process 1 question at a time
     async def process_question(item):
         task_id = item.get("task_id")