| { |
| "name": "Cost control", |
| "objective": "Keep long-running agent workflows within budget by measuring usage, identifying waste, and proposing scoped efficiency improvements.", |
| "trigger": { |
| "type": "scheduled", |
| "cadence_or_event": "Daily or weekly usage review, and when spend, tokens, retries, or runtime exceed thresholds for a workflow." |
| }, |
| "intake": { |
| "sources": ["token and model usage", "tool-call counts", "retry volume", "trace IDs", "billing exports", "recent workflow changes"], |
| "selection_rule": "Cluster usage by workflow, task type, model, and retry cause; investigate only clusters that exceed budget policy or baseline." |
| }, |
| "workspace": { |
| "isolation": "Read-only access to traces, billing exports, dashboards, and workflow configs.", |
| "allowed_actions": ["analyze usage", "inspect traces", "propose config or prompt changes", "verify against representative tasks"], |
| "disallowed_actions": ["silent quality-reducing changes", "disabling verification gates", "production routing changes"] |
| }, |
| "context": { |
| "required_files": ["budget policy", "accepted cost exceptions"], |
| "runtime_sources": ["baseline spend window", "trace samples", "recent prompt and harness changes"] |
| }, |
| "agents": [ |
| { |
| "role": "Analyst", |
| "responsibility": "Cluster usage by workflow, task type, model, tool, and retry cause." |
| }, |
| { |
| "role": "Investigator", |
| "responsibility": "Inspect traces for context bloat, repeated failures, and missing stop conditions." |
| }, |
| { |
| "role": "Optimizer", |
| "responsibility": "Propose the smallest change: smaller context, cheaper routing, caching, batching, or early exit." |
| }, |
| { |
| "role": "Verifier", |
| "responsibility": "Rerun sample tasks or evals to confirm quality is preserved." |
| } |
| ], |
| "verification": { |
| "gates": ["before/after usage measured on a comparable task mix", "quality gates and evals still pass", "savings estimates include uncertainty and sample size", "verification and escalation remain intact"], |
| "receipts": ["baseline spend", "usage clusters", "trace samples", "before/after metrics", "verification results"] |
| }, |
| "state": { |
| "artifacts": ["cost review report", "accepted-exception ledger"], |
| "update_rule": "Record baseline, suspected causes, proposed changes, and verification evidence after each review." |
| }, |
| "budget": { |
| "max_retries": 2, |
| "max_runtime_minutes": 60 |
| }, |
| "escalation": { |
| "conditions": ["quality tradeoff required", "model-routing policy change", "customer impact", "unknown spend source"], |
| "destination": "Workflow owner with before/after evidence and rollout plan" |
| }, |
| "exit": { |
| "success": "Spend returns below threshold, or a verified scoped optimization is proposed with evidence.", |
| "stop_without_success": "The cause is explained but the fix requires owner approval, or retries are exhausted." |
| } |
| } |
|
|