#!/usr/bin/env bash set -euo pipefail ROOT="$(cd "$(dirname "${BASH_SOURCE[0]}")/.." && pwd)" cd "$ROOT" MODELS="${MODELS:-gpt-oss}" ROUTER_AGENT="${ROUTER_AGENT:-hf_hub_community}" ROUTER_AGENT_CARDS="${ROUTER_AGENT_CARDS:-$ROOT/.fast-agent/tool-cards}" TIMEOUT="${TIMEOUT:-240}" RUN_COMMUNITY="${RUN_COMMUNITY:-1}" RUN_ROUTING="${RUN_ROUTING:-1}" RUN_DESC_AB="${RUN_DESC_AB:-1}" echo "[info] root=$ROOT" echo "[info] models=$MODELS" echo "[info] router_agent=$ROUTER_AGENT" echo "[info] router_agent_cards=$ROUTER_AGENT_CARDS" action() { echo; echo "========== $* =========="; } if [[ "$RUN_COMMUNITY" == "1" ]]; then action "HF Hub community challenge scoring" python scripts/score_hf_hub_community_challenges.py --timeout "$TIMEOUT" fi if [[ "$RUN_ROUTING" == "1" ]]; then action "Tool routing batch" python scripts/run_tool_routing_batch.py \ --models "$MODELS" \ --agent "$ROUTER_AGENT" \ --agent-cards "$ROUTER_AGENT_CARDS" \ --timeout "$TIMEOUT" fi if [[ "$RUN_DESC_AB" == "1" ]]; then action "Tool description A/B" python scripts/eval_tool_description_ab.py \ --models "$MODELS" \ --timeout "$TIMEOUT" action "Tool description plots + interpretation" python scripts/plot_tool_description_eval.py fi action "Done" echo "See docs/RESULTS.md for report locations."