tomhflau committed on
Commit
eca8a31
·
1 Parent(s): 54c2fa5

added new system prompt

Browse files
Files changed (1) hide show
  1. app.py +21 -13
app.py CHANGED
@@ -347,24 +347,32 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
347
 
348
  # --- Build Gradio Interface using Blocks ---
349
  with gr.Blocks() as demo:
350
- gr.Markdown("# SmolAgent Evaluation Runner for GAIA")
351
  gr.Markdown(
352
  """
353
- **Instructions:**
354
-
355
- 1. This agent uses smolagents framework with multiple tools:
356
- - 🔍 **DuckDuckGoSearchTool**: Web search capabilities
357
- - 🌐 **VisitWebpageTool**: Can visit and read web pages
358
- - 🧮 **Math Calculator**: Handles mathematical calculations
359
- - 📊 **Data Analysis**: Basic data analysis capabilities
360
- - ✅ **Fact Checker**: Helps verify claims
361
- - 🧠 **Advanced Reasoning**: Structured problem-solving
362
 
363
- 2. Log in to your Hugging Face account using the button below.
364
- 3. Click 'Run Evaluation & Submit All Answers' to start the evaluation.
 
 
 
 
 
 
 
 
365
 
366
  ---
367
- **Note:** This agent is designed for the GAIA dataset and can handle complex, multi-step reasoning tasks.
368
  """
369
  )
370
 
 
347
 
348
  # --- Build Gradio Interface using Blocks ---
349
  with gr.Blocks() as demo:
350
+ gr.Markdown("# 🤖 SmolAgent GAIA Evaluation Runner")
351
  gr.Markdown(
352
  """
353
+ **Enhanced Agent for GAIA Dataset:**
354
+
355
+ 🛠️ **Tools Available:**
356
+ - 🔍 **DuckDuckGoSearchTool**: Real-time web search capabilities
357
+ - 🌐 **VisitWebpageTool**: Can visit and analyze web pages
358
+ - 🧮 **Math Calculator**: Safe mathematical calculations
359
+ - 📊 **Data Analysis**: Basic data analysis capabilities
360
+ - ✅ **Fact Checker**: Helps verify claims with authoritative sources
361
+ - 🧠 **Advanced Reasoning**: Structured problem-solving approach
362
 
363
+ 🎯 **GAIA Format Compliance:**
364
+ - Numbers without commas or units (unless specified)
365
+ - Strings without articles or abbreviations
366
+ - Proper comma-separated lists
367
+ - Extracts only the final answer for submission
368
+
369
+ **Instructions:**
370
+ 1. Log in to your Hugging Face account using the button below.
371
+ 2. Click 'Run Evaluation & Submit All Answers' to start the evaluation.
372
+ 3. The agent will process all questions using multiple tools and reasoning steps.
373
 
374
  ---
375
+ **Note:** This agent follows GAIA's strict answer formatting requirements and uses advanced reasoning with multiple tools.
376
  """
377
  )
378