awesome-loop-engineering / examples / cost-control-loop.json

Sync awesome-loop-engineering

9ec4919 verified 1 day ago

2.93 kB

	{
	"name": "Cost control",
	"objective": "Keep long-running agent workflows within budget by measuring usage, identifying waste, and proposing scoped efficiency improvements.",
	"trigger": {
	"type": "scheduled",
	"cadence_or_event": "Daily or weekly usage review, and when spend, tokens, retries, or runtime exceed thresholds for a workflow."
	},
	"intake": {
	"sources": ["token and model usage", "tool-call counts", "retry volume", "trace IDs", "billing exports", "recent workflow changes"],
	"selection_rule": "Cluster usage by workflow, task type, model, tool, and retry cause; investigate only clusters that exceed budget policy or baseline."
	},
	"workspace": {
	"isolation": "Read-only access to traces, billing exports, dashboards, and workflow configs.",
	"allowed_actions": ["analyze usage", "inspect traces", "propose config or prompt changes", "verify against representative tasks"],
	"disallowed_actions": ["silent quality-reducing changes", "disabling verification gates", "production routing changes"]
	},
	"context": {
	"required_files": ["budget policy", "accepted cost exceptions"],
	"runtime_sources": ["baseline spend window", "trace samples", "recent prompt and harness changes"]
	},
	"agents": [
	{
	"role": "Analyst",
	"responsibility": "Cluster usage by workflow, task type, model, tool, and retry cause."
	},
	{
	"role": "Investigator",
	"responsibility": "Inspect traces for context bloat, repeated failures, and missing stop conditions."
	},
	{
	"role": "Optimizer",
	"responsibility": "Propose the smallest change: smaller context, cheaper routing, caching, batching, or early exit."
	},
	{
	"role": "Verifier",
	"responsibility": "Rerun sample tasks or evals to confirm quality is preserved."
	}
	],
	"verification": {
	"gates": ["before/after usage measured on a comparable task mix", "quality gates and evals still pass", "savings estimates include uncertainty and sample size", "verification gates and escalation paths remain intact"],
	"receipts": ["baseline spend", "usage clusters", "trace samples", "before/after metrics", "verification results"]
	},
	"state": {
	"artifacts": ["cost review report", "accepted-exception ledger"],
	"update_rule": "Record baseline, suspected causes, proposed changes, and verification evidence after each review."
	},
	"budget": {
	"max_retries": 2,
	"max_runtime_minutes": 60
	},
	"escalation": {
	"conditions": ["quality tradeoff required", "model-routing policy change", "customer impact", "unknown spend source"],
	"destination": "Workflow owner with before/after evidence and rollout plan"
	},
	"exit": {
	"success": "Spend returns below threshold, or a verified scoped optimization is proposed with evidence.",
	"stop_without_success": "The cause is explained but the fix requires owner approval, or the retry or runtime budget is exhausted."
	}
	}