cy0307 commited on
Commit
9ec4919
·
verified ·
1 Parent(s): 5c06dfd

Sync awesome-loop-engineering

Browse files

Initial sync from GitHub repository ChaoYue0307/awesome-loop-engineering.

This view is limited to 50 files because it contains too many changes.   See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ assets/awesome-loop-engineering-cover.png filter=lfs diff=lfs merge=lfs -text
.github/ISSUE_TEMPLATE/config.yml ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ blank_issues_enabled: false
2
+ contact_links:
3
+ - name: Community pattern discussion
4
+ url: https://github.com/ChaoYue0307/awesome-loop-engineering/issues/1
5
+ about: Share real-world Loop Engineering patterns, examples, and lessons learned.
6
+ - name: Open a pull request
7
+ url: https://github.com/ChaoYue0307/awesome-loop-engineering/compare
8
+ about: If you already know where the resource belongs, a pull request is preferred.
9
+ - name: Support guide
10
+ url: https://github.com/ChaoYue0307/awesome-loop-engineering/blob/main/SUPPORT.md
11
+ about: Choose the right support, correction, translation, or security channel.
.github/ISSUE_TEMPLATE/pattern-suggestion.yml ADDED
@@ -0,0 +1,91 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Loop pattern suggestion
2
+ description: Suggest a recurring AI-agent loop pattern for the pattern library.
3
+ title: "[Pattern]: "
4
+ labels:
5
+ - pattern-suggestion
6
+ body:
7
+ - type: input
8
+ id: name
9
+ attributes:
10
+ label: Pattern name
11
+ description: Short name for the loop pattern.
12
+ placeholder: PR babysitter
13
+ validations:
14
+ required: true
15
+ - type: textarea
16
+ id: objective
17
+ attributes:
18
+ label: Objective
19
+ description: What outcome should this loop optimize for?
20
+ placeholder: Keep an open PR moving toward merge readiness without repeated human polling.
21
+ validations:
22
+ required: true
23
+ - type: textarea
24
+ id: trigger
25
+ attributes:
26
+ label: Trigger
27
+ description: What starts the loop?
28
+ placeholder: Schedule, webhook, failed check, new review comment, release event, or manual bootstrap command.
29
+ validations:
30
+ required: true
31
+ - type: textarea
32
+ id: intake
33
+ attributes:
34
+ label: Discover / intake
35
+ description: Where does the loop find work?
36
+ placeholder: GitHub PR comments, CI failures, Linear tickets, logs, alerts, feedback streams.
37
+ validations:
38
+ required: true
39
+ - type: textarea
40
+ id: delegation
41
+ attributes:
42
+ label: Agents and delegation
43
+ description: Which agent roles are involved and how is work handed off?
44
+ placeholder: Explorer identifies blockers, Implementer patches, Reviewer checks scope, Judge decides next action.
45
+ validations:
46
+ required: true
47
+ - type: textarea
48
+ id: verification
49
+ attributes:
50
+ label: Verification gates
51
+ description: What says yes or no?
52
+ placeholder: Required checks pass, examples run, dashboard thresholds hold, reviewer approves, trace grader passes.
53
+ validations:
54
+ required: true
55
+ - type: textarea
56
+ id: state
57
+ attributes:
58
+ label: Durable state
59
+ description: What survives the next run?
60
+ placeholder: Progress file, issue comment, database checkpoint, trace, status report, processed IDs.
61
+ validations:
62
+ required: true
63
+ - type: textarea
64
+ id: budget
65
+ attributes:
66
+ label: Budget and exit
67
+ description: When should the loop stop?
68
+ placeholder: Max retries, max runtime, success condition, stop-without-success condition.
69
+ validations:
70
+ required: true
71
+ - type: textarea
72
+ id: escalation
73
+ attributes:
74
+ label: Escalation
75
+ description: When should a human take over and where should the loop report?
76
+ placeholder: Missing credentials, architecture judgment, production approval, repeated failure, unclear ownership.
77
+ validations:
78
+ required: true
79
+ - type: checkboxes
80
+ id: checklist
81
+ attributes:
82
+ label: Checklist
83
+ options:
84
+ - label: This is a recurring AI-agent loop, not a one-off prompt or generic automation.
85
+ required: true
86
+ - label: The pattern includes trigger, intake, delegation, verification, durable state, budget, escalation, and exit.
87
+ required: true
88
+ - label: The pattern has at least one concrete verification gate stronger than model self-assessment.
89
+ required: true
90
+ - label: Sensitive actions are human-approved or explicitly out of scope.
91
+ required: true
.github/ISSUE_TEMPLATE/resource-suggestion.yml ADDED
@@ -0,0 +1,110 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Resource suggestion
2
+ description: Suggest a paper, blog, note, tool, benchmark, or critique for the list.
3
+ title: "[Resource]: "
4
+ labels:
5
+ - resource-suggestion
6
+ body:
7
+ - type: input
8
+ id: title
9
+ attributes:
10
+ label: Resource title
11
+ description: The title of the resource.
12
+ placeholder: Loop Engineering
13
+ validations:
14
+ required: true
15
+ - type: input
16
+ id: url
17
+ attributes:
18
+ label: URL
19
+ description: Public, stable URL for the resource.
20
+ placeholder: https://example.com
21
+ validations:
22
+ required: true
23
+ - type: dropdown
24
+ id: category
25
+ attributes:
26
+ label: Suggested category
27
+ options:
28
+ - Start Here
29
+ - Core Loop Primitives
30
+ - Official Runtime Guides
31
+ - Research Foundations
32
+ - Agent Workflow Patterns
33
+ - Coding-Agent Loop Systems
34
+ - Verification And Feedback Gates
35
+ - State, Memory, And Context Persistence
36
+ - Orchestration And Multi-Agent Delegation
37
+ - Benchmarks And Evaluation
38
+ - Operations Playbooks
39
+ - Templates And Patterns
40
+ - Critiques, Risks, And Limitations
41
+ - Adjacent Awesome Lists
42
+ - Not sure
43
+ validations:
44
+ required: true
45
+ - type: dropdown
46
+ id: source_type
47
+ attributes:
48
+ label: Resource type
49
+ options:
50
+ - 📄 Paper
51
+ - 📝 Blog
52
+ - 📚 Docs
53
+ - 🧰 Tool
54
+ - 🧪 Benchmark
55
+ - 🔁 Pattern
56
+ - 🧾 Template
57
+ - 🧭 List
58
+ - ⚠️ Critique
59
+ - Other
60
+ validations:
61
+ required: true
62
+ - type: dropdown
63
+ id: quality_label
64
+ attributes:
65
+ label: Quality label
66
+ description: Choose the strongest reason this source is useful.
67
+ options:
68
+ - Primary source
69
+ - Official docs
70
+ - Implementation-heavy
71
+ - Foundational
72
+ - Cautionary
73
+ - Adjacent
74
+ - Not sure
75
+ validations:
76
+ required: true
77
+ - type: textarea
78
+ id: relevance
79
+ attributes:
80
+ label: Why it belongs
81
+ description: Explain how this resource helps people design recurring agent systems above prompt, context, and harness engineering.
82
+ placeholder: This belongs because...
83
+ validations:
84
+ required: true
85
+ - type: dropdown
86
+ id: evidence_quality
87
+ attributes:
88
+ label: Evidence quality
89
+ description: Prefer primary, practical, and implementation-oriented sources.
90
+ options:
91
+ - Tier A - primary source or official docs
92
+ - Tier B - practitioner write-up with implementation detail
93
+ - Tier C - curated survey or high-quality explainer
94
+ - Tier D - commentary or news coverage
95
+ - Not sure
96
+ validations:
97
+ required: true
98
+ - type: checkboxes
99
+ id: checklist
100
+ attributes:
101
+ label: Checklist
102
+ options:
103
+ - label: This is about AI/coding-agent Loop Engineering or a direct foundation for recurring agent systems.
104
+ required: true
105
+ - label: If this is adjacent prompt, context, or harness content, it clearly connects to repeated runs, state, verification, or escalation.
106
+ required: true
107
+ - label: This is not about unrelated event loops, growth loops, or generic automation.
108
+ required: true
109
+ - label: I checked that the resource is not already listed.
110
+ required: true
.github/ISSUE_TEMPLATE/translation.yml ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Translation proposal
2
+ description: Propose a new translation or volunteer to maintain one.
3
+ title: "[Translation]: "
4
+ labels:
5
+ - translation
6
+ body:
7
+ - type: input
8
+ id: language
9
+ attributes:
10
+ label: Language
11
+ description: Which language do you want to add or maintain?
12
+ placeholder: Japanese
13
+ validations:
14
+ required: true
15
+ - type: input
16
+ id: file
17
+ attributes:
18
+ label: Proposed file name
19
+ description: See TRANSLATIONS.md for suggested names.
20
+ placeholder: README.ja.md
21
+ validations:
22
+ required: true
23
+ - type: textarea
24
+ id: scope
25
+ attributes:
26
+ label: Translation scope
27
+ description: What will you translate first?
28
+ placeholder: Introduction, Loop Contract, maturity model, contribution instructions...
29
+ validations:
30
+ required: true
31
+ - type: checkboxes
32
+ id: checklist
33
+ attributes:
34
+ label: Checklist
35
+ options:
36
+ - label: I will preserve the narrow AI/coding-agent scope.
37
+ required: true
38
+ - label: I will link back to the canonical English README.
39
+ required: true
40
+ - label: I will keep resource URLs unchanged.
41
+ required: true
.github/pull_request_template.md ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Pull Request
2
+
3
+ ## What Changed
4
+
5
+ Select all that apply.
6
+
7
+ - [ ] Added or updated resource entries
8
+ - [ ] Added or updated a loop pattern
9
+ - [ ] Added or updated a translation
10
+ - [ ] Improved docs, templates, or repository presentation
11
+ - [ ] Fixed links, typos, or formatting
12
+
13
+ ## Resource Summary
14
+
15
+ List the resources, patterns, or translation files changed.
16
+
17
+ - Title and URL:
18
+
19
+ ## Relevance To Loop Engineering
20
+
21
+ Explain how this PR relates to the new AI/coding-agent meaning of Loop Engineering: the layer above prompt, context, and harness engineering where recurring systems trigger agents, provide context, bound actions, verify results, persist state, retry, and escalate.
22
+
23
+ ## Category
24
+
25
+ Which README section did you update?
26
+
27
+ - [ ] Start Here
28
+ - [ ] Core Loop Primitives
29
+ - [ ] Official Runtime Guides
30
+ - [ ] Research Foundations
31
+ - [ ] Agent Workflow Patterns
32
+ - [ ] Coding-Agent Loop Systems
33
+ - [ ] Verification And Feedback Gates
34
+ - [ ] State, Memory, And Context Persistence
35
+ - [ ] Orchestration And Multi-Agent Delegation
36
+ - [ ] Benchmarks And Evaluation
37
+ - [ ] Operations Playbooks
38
+ - [ ] Templates And Patterns
39
+ - [ ] Critiques, Risks, And Limitations
40
+ - [ ] Adjacent Awesome Lists
41
+ - [ ] Translation or repository docs
42
+
43
+ ## Source Type
44
+
45
+ - [ ] 📄 Paper
46
+ - [ ] 📝 Blog
47
+ - [ ] 📚 Docs
48
+ - [ ] 🧰 Tool
49
+ - [ ] 🧪 Benchmark
50
+ - [ ] 🔁 Pattern
51
+ - [ ] 🧾 Template
52
+ - [ ] 🧭 List
53
+ - [ ] ⚠️ Critique
54
+
55
+ ## Quality Labels
56
+
57
+ - [ ] Direct Loop Engineering source
58
+ - [ ] Paper or technical report
59
+ - [ ] Official documentation
60
+ - [ ] Engineering blog or field note
61
+ - [ ] Tool, framework, or repository
62
+ - [ ] Benchmark or evaluation resource
63
+ - [ ] Critique or limitation analysis
64
+ - [ ] Adjacent awesome list
65
+ - [ ] Primary source
66
+ - [ ] Implementation-heavy
67
+ - [ ] Foundational
68
+ - [ ] Cautionary
69
+ - [ ] Translation
70
+ - [ ] Repository maintenance
71
+
72
+ ## Evidence Quality
73
+
74
+ - [ ] Tier A: primary source or official docs
75
+ - [ ] Tier B: practitioner write-up with implementation detail
76
+ - [ ] Tier C: curated survey or high-quality explainer
77
+ - [ ] Tier D: commentary or news coverage
78
+
79
+ ## Checklist
80
+
81
+ - [ ] I searched the README for duplicates.
82
+ - [ ] The resource is public and has a stable URL.
83
+ - [ ] The entry is in the most specific category.
84
+ - [ ] The entry includes the correct resource type label, such as `📄 **Paper**` or `📚 **Docs**`.
85
+ - [ ] The annotation explains why the resource matters for loop design.
86
+ - [ ] Adjacent prompt, context, or harness resources explicitly connect to repeated agent runs, state, verification, or escalation.
87
+ - [ ] The entry follows the format: `- 📄 **Paper** [Title](https://example.com) - One sentence annotation.`
88
+ - [ ] The resource is not about unrelated event loops, growth loops, control theory, or generic automation.
89
+ - [ ] New loop patterns include trigger, discover/intake, delegation, state, verification gates, retry budget, escalation path, and loop instruction or automation artifact.
90
+ - [ ] I agree that my contribution to this repository is released under `CC0-1.0`.
91
+ - [ ] I did not copy third-party content into this repository without the right to do so.
92
+ - [ ] Any translation links back to the canonical English README.
.github/workflows/quality.yml ADDED
@@ -0,0 +1,80 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Quality
2
+
3
+ on:
4
+ pull_request:
5
+ push:
6
+ branches:
7
+ - main
8
+ schedule:
9
+ - cron: "17 3 * * 1"
10
+ workflow_dispatch:
11
+
12
+ permissions:
13
+ contents: read
14
+
15
+ concurrency:
16
+ group: quality-${{ github.ref }}
17
+ cancel-in-progress: true
18
+
19
+ jobs:
20
+ docs:
21
+ name: Docs quality gates
22
+ runs-on: ubuntu-latest
23
+ permissions:
24
+ contents: read
25
+ issues: write
26
+ env:
27
+ FORCE_JAVASCRIPT_ACTIONS_TO_NODE24: "true"
28
+ steps:
29
+ - name: Check out repository
30
+ uses: actions/checkout@v4
31
+
32
+ - name: Set up Python
33
+ uses: actions/setup-python@v5
34
+ with:
35
+ python-version: "3.x"
36
+
37
+ - name: Check Markdown formatting
38
+ uses: DavidAnson/markdownlint-cli2-action@v17
39
+ with:
40
+ globs: "**/*.md"
41
+
42
+ - name: Check Awesome list standards
43
+ run: npx --yes awesome-lint
44
+
45
+ - name: Check license text
46
+ run: python scripts/check_license.py
47
+
48
+ - name: Check resource type labels
49
+ run: python scripts/check_resource_labels.py README.md
50
+
51
+ - name: Check loop contract examples
52
+ run: |
53
+ python scripts/check_loop_contract_examples.py
54
+ python scripts/preview_loop_contract.py examples/pr-babysitter-loop.json >/tmp/pr-babysitter-preview.md
55
+
56
+ - name: Check Pages metadata
57
+ run: python scripts/check_pages_metadata.py
58
+
59
+ - name: Check internal links
60
+ run: python scripts/check_internal_links.py
61
+
62
+ - name: Check translation sync markers
63
+ run: python scripts/check_translation_sync.py
64
+
65
+ - name: Check links
66
+ run: python scripts/verify_urls.py . --timeout 12 --workers 20
67
+
68
+ - name: Check main commit identity
69
+ if: github.event_name == 'push' && github.ref == 'refs/heads/main'
70
+ run: python scripts/check_commit_identity.py
71
+
72
+ - name: Open an issue when a scheduled run fails
73
+ if: failure() && github.event_name == 'schedule'
74
+ env:
75
+ GH_TOKEN: ${{ github.token }}
76
+ run: |
77
+ gh issue create \
78
+ --repo "$GITHUB_REPOSITORY" \
79
+ --title "Scheduled quality run failed on $(date -u +%Y-%m-%d)" \
80
+ --body "The weekly quality workflow failed, most likely a dead link or a stale translation sync marker. See the run: ${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }}"
.gitignore ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ __pycache__/
2
+ *.py[cod]
.markdownlint.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "MD013": false,
3
+ "MD033": false,
4
+ "MD060": false
5
+ }
AGENTS.md ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Repository Guidance For AI Agents
2
+
3
+ This repository curates resources for the new AI/coding-agent meaning of **Loop Engineering**.
4
+
5
+ ## Scope
6
+
7
+ Include resources that help readers design, run, verify, evaluate, or critique recurring AI-agent systems that sit above prompt, context, and harness engineering. A good entry should explain how a loop discovers work, delegates to agents, supplies context, bounds tools and permissions, verifies results, persists state, decides next actions, retries, or escalates.
8
+
9
+ Do not include unrelated uses of "loop":
10
+
11
+ - software event loops;
12
+ - UI/game loops;
13
+ - control theory;
14
+ - growth loops;
15
+ - generic workflow automation;
16
+ - non-AI feedback loops.
17
+
18
+ ## Editing Rules
19
+
20
+ - Keep `README.md` as the canonical English source.
21
+ - Preserve the four-layer framing when editing the intro, scope, or mental model: prompt, context, and harness engineering improve one run; Loop Engineering governs repeated agent work over time.
22
+ - Keep annotations short, specific, and builder-oriented.
23
+ - Prefer primary sources, official docs, papers, and implementation-heavy write-ups.
24
+ - If a resource is generic agent, prompt, context, or harness content, include it only when the annotation clearly explains its loop-design relevance.
25
+ - Update `README.zh-CN.md` only for translated overview content; do not let it drift into a separate resource list unless maintained.
26
+ - When adding a new category, update `README.md`, `CONTRIBUTING.md`, PR templates, and issue templates together.
27
+ - Do not add generated marketing copy or unsupported hype.
28
+
29
+ ## Commit Identity Rule
30
+
31
+ Never create commits with AI-assistant co-author trailers or any non-owner author/committer identity. All commits in this repository must be authored and committed as `ChaoYue0307 <hechaoyue0307@gmail.com>`.
32
+
33
+ When committing from an AI agent, do not use plain `git commit` if the environment may append co-author trailers. Create commits with explicit identity instead:
34
+
35
+ ```sh
36
+ git add <files>
37
+ PARENT="$(git rev-parse HEAD)"
38
+ TREE="$(git write-tree)"
39
+ NEW="$(GIT_AUTHOR_NAME='ChaoYue0307' GIT_AUTHOR_EMAIL='hechaoyue0307@gmail.com' GIT_COMMITTER_NAME='ChaoYue0307' GIT_COMMITTER_EMAIL='hechaoyue0307@gmail.com' git commit-tree "$TREE" -p "$PARENT" -m "Commit message")"
40
+ git update-ref refs/heads/main "$NEW" "$PARENT"
41
+ ```
42
+
43
+ Before pushing, verify:
44
+
45
+ ```sh
46
+ python scripts/check_commit_identity.py
47
+ ```
48
+
49
+ ## Entry Format
50
+
51
+ ```md
52
+ - 📄 **Paper** [Title](https://example.com) - One sentence explaining the resource's contribution to Loop Engineering.
53
+ ```
54
+
55
+ ## Quality Preference
56
+
57
+ When two sources overlap, prefer:
58
+
59
+ 1. primary source or official docs;
60
+ 2. implementation details over commentary;
61
+ 3. stable URLs over social posts;
62
+ 4. practical loop design over broad AI-agent trend coverage.
ANTI-PATTERNS.md ADDED
@@ -0,0 +1,75 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Loop Engineering Anti-Patterns
2
+
3
+ Use this page to reject unsafe, vague, or misleading loop designs.
4
+
5
+ ## Prompt Loop With No Contract
6
+
7
+ **Symptom:** A script repeatedly asks an agent to "keep improving" without a named objective, intake, state, verification, or exit condition.
8
+
9
+ **Why it fails:** The loop becomes a manual prompting habit disguised as automation.
10
+
11
+ **Better:** Define the loop contract before running: objective, trigger, intake, workspace, context, delegation, verification, state, budget, escalation, and exit.
12
+
13
+ ## Infinite Retry Loop
14
+
15
+ **Symptom:** The loop keeps feeding failures back to the agent indefinitely.
16
+
17
+ **Why it fails:** Cost grows, context degrades, and the loop may repeatedly damage the same files.
18
+
19
+ **Better:** Set retry budgets per blocker, stop on repeated failures, and escalate with evidence.
20
+
21
+ ## Model Self-Approval
22
+
23
+ **Symptom:** The same agent that made the change decides that the work is complete.
24
+
25
+ **Why it fails:** Models can rationalize their own mistakes and miss regressions they introduced.
26
+
27
+ **Better:** Use deterministic checks, a separate verifier agent, or human review for completion gates.
28
+
29
+ ## Hidden State
30
+
31
+ **Symptom:** The only memory is inside the conversation.
32
+
33
+ **Why it fails:** The next run cannot reliably know what was tried, what passed, what failed, or what remains.
34
+
35
+ **Better:** Persist state in files, issues, comments, checkpoints, traces, or workflow state.
36
+
37
+ ## Unsafe Production Autonomy
38
+
39
+ **Symptom:** A loop can deploy, roll back, change config, rotate secrets, or modify data without explicit approval boundaries.
40
+
41
+ **Why it fails:** A small model error can become an operational incident.
42
+
43
+ **Better:** Make sensitive actions approval-gated and document rollback, escalation, and owner rules.
44
+
45
+ ## Generic Automation Rebranded As Loop Engineering
46
+
47
+ **Symptom:** A cron job or workflow runs without agentic reasoning, context loading, verification, or stateful next-action decisions.
48
+
49
+ **Why it fails:** It blurs Loop Engineering with ordinary automation.
50
+
51
+ **Better:** Call ordinary automation ordinary automation. Use Loop Engineering when repeated agent work is actually being triggered, bounded, verified, persisted, and rerun.
52
+
53
+ ## Context Dump Loop
54
+
55
+ **Symptom:** Each run gives the agent a huge context bundle instead of a curated state contract.
56
+
57
+ **Why it fails:** The loop becomes slow, expensive, and hard to debug.
58
+
59
+ **Better:** Separate durable state from supporting context. Load only the state, docs, examples, and receipts needed for the current objective.
60
+
61
+ ## No Escalation Path
62
+
63
+ **Symptom:** The loop keeps acting even when it lacks credentials, sees ambiguous product requirements, hits flaky infrastructure, or needs architectural judgment.
64
+
65
+ **Why it fails:** The agent spends budget where a human decision is required.
66
+
67
+ **Better:** Define escalation triggers and include the evidence a human needs to take over.
68
+
69
+ ## No Receipts
70
+
71
+ **Symptom:** The loop says it is done without commands, logs, changed files, trace IDs, dashboard snapshots, reviewer decisions, or links.
72
+
73
+ **Why it fails:** Maintainers cannot audit the loop or trust its result.
74
+
75
+ **Better:** Require receipts as part of the exit gate.
CITATION.bib ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ @misc{chaoyue2026awesome_loop_engineering,
2
+ author = {He, Chaoyue},
3
+ title = {Awesome Loop Engineering},
4
+ year = {2026},
5
+ howpublished = {\url{https://github.com/ChaoYue0307/awesome-loop-engineering}},
6
+ note = {Curated resources for Loop Engineering}
7
+ }
CITATION.cff ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ cff-version: 1.2.0
2
+ message: "If this repository is useful in your work, please cite it as below."
3
+ title: "Awesome Loop Engineering"
4
+ type: software
5
+ authors:
6
+ - family-names: "He"
7
+ given-names: "Chaoyue"
8
+ repository-code: "https://github.com/ChaoYue0307/awesome-loop-engineering"
9
+ url: "https://chaoyue0307.github.io/awesome-loop-engineering/"
10
+ abstract: "Curated resources and practical patterns for Loop Engineering with AI and coding agents."
11
+ keywords:
12
+ - loop-engineering
13
+ - ai-agents
14
+ - coding-agents
15
+ - agentic-workflows
16
+ license: CC0-1.0
CODE_OF_CONDUCT.md ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Code Of Conduct
2
+
3
+ Awesome Loop Engineering is a technical curation project. Contributors should help keep discussions accurate, specific, and useful for builders.
4
+
5
+ ## Expected Behavior
6
+
7
+ - Be respectful and assume good intent.
8
+ - Keep feedback concrete and evidence-based.
9
+ - Prefer primary sources and verifiable claims.
10
+ - Disclose caveats such as vendor bias, paywalls, unstable links, or weak evidence.
11
+ - Respect maintainers' scope decisions when a resource is not specific to AI/coding-agent Loop Engineering.
12
+
13
+ ## Unacceptable Behavior
14
+
15
+ - Harassment, insults, threats, or discriminatory language.
16
+ - Spam, link farming, or promotional submissions without technical substance.
17
+ - Posting secrets, private customer data, credentials, or internal-only links.
18
+ - Misrepresenting a source, author, benchmark, tool, or affiliation.
19
+ - Repeatedly pushing unrelated event-loop, growth-loop, control-theory, or generic automation content into scope.
20
+
21
+ ## Enforcement
22
+
23
+ Maintainers may edit, close, or remove issues, pull requests, comments, or links that violate this code of conduct or the repository scope. Serious or repeated violations may lead to blocked participation.
24
+
25
+ ## Reporting
26
+
27
+ If a discussion becomes unsafe or inappropriate, open an issue with sensitive details removed, or contact the maintainer through GitHub. For security-sensitive concerns, follow `SECURITY.md`.
COMPARISON.md ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Comparison Guide
2
+
3
+ Loop Engineering is easiest to understand by separating it from nearby practices.
4
+
5
+ ## Prompt Engineering vs Loop Engineering
6
+
7
+ **Prompt Engineering** asks: what should I say to the model now?
8
+
9
+ **Loop Engineering** asks: what system should discover work, delegate to agents, verify results, persist state, decide next actions, and rerun?
10
+
11
+ Prompt engineering can be part of a loop instruction, but a good prompt alone is not a loop.
12
+
13
+ ## Context Engineering vs Loop Engineering
14
+
15
+ **Context Engineering** asks: what state, memory, documents, examples, and tool results should the model see?
16
+
17
+ **Loop Engineering** asks: when should context be loaded, what state should survive across runs, and how should that state affect the next run?
18
+
19
+ Context engineering improves the input to an agent. Loop Engineering governs recurring agent work over time.
20
+
21
+ ## Harness Engineering vs Loop Engineering
22
+
23
+ **Harness Engineering** asks: what tools, permissions, sandboxes, tests, traces, and feedback surround one agent run?
24
+
25
+ **Loop Engineering** asks: how should repeated agent runs use those harnesses to act, verify, record receipts, retry, and escalate?
26
+
27
+ Harness engineering makes a run safer and more observable. Loop Engineering decides when and why that run happens again.
28
+
29
+ ## Workflow Automation vs Loop Engineering
30
+
31
+ **Workflow automation** executes predefined steps.
32
+
33
+ **Loop Engineering** coordinates agentic work that may require discovery, delegation, tool use, verification, state updates, and next-action decisions.
34
+
35
+ Many loops use workflow automation. Not every workflow automation is Loop Engineering.
36
+
37
+ ## Agent Workflow vs Loop Engineering
38
+
39
+ **Agent workflows** describe how models, tools, and agents solve a task.
40
+
41
+ **Loop Engineering** describes how work recurs: what triggers it, what state persists, what gates completion, when retry is allowed, and when humans take over.
42
+
43
+ An agent workflow can be the inner mechanism. The loop is the operating system around repeated work.
44
+
45
+ ## Evaluation Loop vs Operational Loop
46
+
47
+ **Evaluation loops** repeatedly measure and improve prompts, tools, models, or harnesses.
48
+
49
+ **Operational loops** repeatedly perform engineering work such as PR babysitting, CI repair, docs drift collection, feedback clustering, or deploy verification.
50
+
51
+ Both are valid Loop Engineering patterns when they have a clear trigger, state, verification, budget, and exit.
52
+
53
+ ## Quick Test
54
+
55
+ Ask these questions before calling something Loop Engineering:
56
+
57
+ 1. Does it run more than once by design?
58
+ 1. Does it discover or receive work from a real source?
59
+ 1. Does it delegate work to one or more agents?
60
+ 1. Does it verify results with explicit gates?
61
+ 1. Does it persist state or receipts outside the model context?
62
+ 1. Does it decide whether to repeat, report, escalate, or stop?
63
+
64
+ If the answer is mostly no, it may be prompt engineering, context engineering, harness engineering, or automation, but it is probably not Loop Engineering.
CONTRIBUTING.md ADDED
@@ -0,0 +1,172 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Contributing
2
+
3
+ Thanks for helping improve Awesome Loop Engineering.
4
+
5
+ This repository is intentionally narrow. It tracks the new AI and coding-agent meaning of **Loop Engineering**: the layer above prompt, context, and harness engineering where teams design systems that discover work, delegate to agents, verify outcomes, persist state, decide next actions, and run again on a cadence or until a goal is met.
6
+
7
+ Before submitting, read the [curation standard](meta/CURATION.md). Maintainers use it to decide whether a resource is specific, stable, and useful enough for the list.
8
+
9
+ ## Quick PR Flow
10
+
11
+ 1. Search `README.md` for the resource title, author, project, and URL.
12
+ 1. Confirm the resource is about AI/coding-agent Loop Engineering or a direct foundation for it.
13
+ 1. Pick the most specific category.
14
+ 1. Add one entry with a resource type label:
15
+
16
+ ```md
17
+ - 📄 **Paper** [Title](https://example.com) - One sentence explaining the resource's contribution to Loop Engineering.
18
+ ```
19
+
20
+ 1. Open a PR using the template and explain:
21
+ - why the resource belongs;
22
+ - which category it updates;
23
+ - whether it is a primary source, official documentation, paper, tool, benchmark, playbook, critique, or adjacent list;
24
+ - the evidence quality tier and resource type label;
25
+ - any caveat such as vendor bias, paywall, early-stage status, or weak evidence.
26
+
27
+ ## License For Contributions
28
+
29
+ By contributing to this repository, you agree that your contribution to this repository's curation text, annotations, templates, patterns, metadata, and documentation is released under [CC0-1.0](LICENSE).
30
+
31
+ Do not copy third-party articles, papers, images, documentation, code, or other content into this repository unless you have the right to do so. Prefer stable links and short original annotations. External resources keep their own licenses and terms.
32
+
33
+ ## What Belongs Here
34
+
35
+ Good additions usually fit one of these groups:
36
+
37
+ - Direct explanations of Loop Engineering in the AI/coding-agent sense.
38
+ - Papers that introduce agent loops, reflection, critique, verification, planning, tool use, or memory patterns used by looped agents.
39
+ - Official docs for agent runtimes, hooks, subagents, skills, guardrails, observability, MCP, worktrees, automations, goals, or state persistence.
40
+ - Engineering blogs with concrete implementation details, failure modes, or production lessons.
41
+ - Benchmarks and eval systems for long-horizon, tool-using, or coding agents.
42
+ - Playbooks for recurring agent work such as PR babysitting, CI repair, issue triage, deploy verification, bug hunting, docs drift collection, and feedback clustering.
43
+ - Critiques that clarify when loops are risky, wasteful, or not yet justified.
44
+ - Translation improvements that make the concept accessible without changing the scope.
45
+
46
+ ## What Does Not Belong Here
47
+
48
+ Please avoid submitting:
49
+
50
+ - Software event loops, UI event loops, game loops, control theory loops, growth loops, or generic feedback-loop content unless it is explicitly applied to AI agent loops.
51
+ - Generic prompt engineering resources with no loop, tool, verification, state, or scheduling angle.
52
+ - Generic context or harness engineering resources unless they directly explain how repeated agent runs are triggered, verified, persisted, or governed.
53
+ - Resources that only improve single-turn prompts belong in prompt-engineering lists unless they show scheduling, state, verification, retries, or escalation.
54
+ - Generic agent news, product launches, or listicles without technical substance.
55
+ - Private, unstable, or paywalled sources that most readers cannot inspect.
56
+ - Duplicate resources already covered by an existing entry.
57
+ - Pure marketing pages with no reusable technical insight.
58
+
59
+ ## Evidence Quality
60
+
61
+ Prefer higher tiers when two resources cover the same idea.
62
+
63
+ | Tier | Source type | Examples |
64
+ | --- | --- | --- |
65
+ | A | Primary source or official docs | Tool docs, paper, project README, author write-up |
66
+ | B | Practitioner write-up with implementation detail | Field notes, playbooks, postmortems |
67
+ | C | Curated survey or high-quality explainer | Taxonomy, comparison, tutorial |
68
+ | D | Commentary or news coverage | Useful only when it documents origin, adoption, or debate |
69
+
70
+ If two links say the same thing, prefer the more primary, practical, stable, and implementation-oriented one.
71
+
72
+ ## Quality Labels
73
+
74
+ Use these labels in PR descriptions and issue suggestions when they help reviewers understand why a resource belongs:
75
+
76
+ - **Primary source**: written by the original author, project, vendor, or research team.
77
+ - **Official docs**: documentation for a runtime, SDK, API, benchmark, or platform.
78
+ - **Implementation-heavy**: includes code, architecture, commands, traces, or operational details.
79
+ - **Foundational**: explains a core loop mechanism such as ReAct, reflection, planning, state, or verification.
80
+ - **Cautionary**: clarifies limitations, risks, cost, safety, or when not to use loops.
81
+ - **Adjacent**: useful context from prompt, context, harness, eval, or agent engineering.
82
+
83
+ ## Category Guidance
84
+
85
+ - Use **Start Here** only for direct Loop Engineering explainers.
86
+ - Use **The Loop Contract** and **Loop Maturity Model** only for framework-level content, not individual links.
87
+ - Use **Core Loop Primitives** for automations, goals, worktrees, hooks, skills, connectors, subagents, and state files.
88
+ - Use **Official Runtime Guides** for primary-source docs from tool builders.
89
+ - Use **Research Foundations** for papers and reference implementations that explain the mechanics behind agent loops.
90
+ - Use **Agent Workflow Patterns** for general workflow architecture, durable execution, and official guidance.
91
+ - Use **Coding-Agent Loop Systems** for systems that run agents over repositories, terminals, code, or software issues.
92
+ - Use **Verification And Feedback Gates** for tests, evals, CI, tracing, guardrails, deterministic checks, and LLM-as-judge caveats.
93
+ - Use **State, Memory, And Context Persistence** for durable state, checkpoints, context, progress files, and memory.
94
+ - Use **Orchestration And Multi-Agent Delegation** for subagents, handoffs, manager-worker loops, and workflow runtimes.
95
+ - Use **Benchmarks And Evaluation** for benchmarks that measure agent behavior over multi-step tasks.
96
+ - Use **Operations Playbooks** for recurring engineering jobs run by agents.
97
+ - Use **Templates And Patterns** for reusable pattern docs hosted in this repository.
98
+ - Use **Critiques, Risks, And Limitations** for thoughtful warnings and failure analysis.
99
+ - Use **Adjacent Awesome Lists** for neighboring maps, not individual resources.
100
+
101
+ ## Annotation Style
102
+
103
+ Keep annotations short, specific, and builder-oriented.
104
+
105
+ Use the resource type legend from `README.md`:
106
+
107
+ - 📄 **Paper**
108
+ - 📝 **Blog**
109
+ - 📚 **Docs**
110
+ - 🧰 **Tool**
111
+ - 🧪 **Benchmark**
112
+ - 🔁 **Pattern**
113
+ - 🧾 **Template**
114
+ - 🧭 **List**
115
+ - ⚠️ **Critique**
116
+
117
+ Prefer:
118
+
119
+ ```md
120
+ - 🔁 **Pattern** [Autonomous Loops](https://example.com) - Shows how to combine task files, stop hooks, limits, and kill switches into a self-continuing agent loop.
121
+ ```
122
+
123
+ Avoid:
124
+
125
+ ```md
126
+ - 📝 **Blog** [Cool Agent Article](https://example.com) - Interesting article about AI.
127
+ ```
128
+
129
+ ## Adding A Loop Pattern
130
+
131
+ For a practical loop pattern, use [`templates/loop-pattern.md`](templates/loop-pattern.md), optionally structure it with [`schemas/loop-contract.schema.json`](schemas/loop-contract.schema.json), and place the finished pattern in [`patterns/`](patterns/). A good pattern names:
132
+
133
+ - objective;
134
+ - trigger;
135
+ - intake source;
136
+ - agents and roles;
137
+ - workspace and permissions;
138
+ - verification gates;
139
+ - durable state;
140
+ - budget and exit conditions;
141
+ - escalation path;
142
+ - loop instruction, automation spec, hook config, or scheduled command;
143
+ - failure modes.
144
+
145
+ Pattern PRs should be concrete enough that a reader can adapt them to an agent runtime without guessing the loop contract. If you want feedback before writing the full pattern, open a loop pattern suggestion issue.
146
+
147
+ ## Translation Contributions
148
+
149
+ See [TRANSLATIONS.md](TRANSLATIONS.md).
150
+
151
+ Translation PRs should:
152
+
153
+ - link back to the canonical English README;
154
+ - preserve the narrow AI/coding-agent scope;
155
+ - keep resource URLs unchanged;
156
+ - update language navigation if a new language file is added;
157
+ - explain who can help maintain the translation.
158
+
159
+ ## Issues
160
+
161
+ If you do not want to open a PR, use the resource suggestion issue template. Please include:
162
+
163
+ - title and URL;
164
+ - suggested category;
165
+ - resource type label;
166
+ - evidence quality tier;
167
+ - why it is relevant to Loop Engineering;
168
+ - whether it is a direct Loop Engineering source, official docs, paper, engineering note, tool, benchmark, critique, or translation.
169
+
170
+ ## Review Standard
171
+
172
+ Maintainers may ask for stronger relevance, a more precise category, a better annotation, or removal of promotional language. The goal is to keep the list useful for people designing real agent loops, not to collect every AI-agent link on the internet.
DEFINITION.md ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Canonical Definition
2
+
3
+ Use this page when you need a short, stable definition of Loop Engineering.
4
+
5
+ ## Short Definition
6
+
7
+ **Loop Engineering** is the AI and coding-agent practice of designing recurring systems that discover work, delegate it to agents, verify results, persist state, decide next actions, and run again on a cadence, event, or until a verifiable goal is reached.
8
+
9
+ ## One-Sentence Positioning
10
+
11
+ Prompt engineering improves what you ask the model, context engineering improves what the model can see, harness engineering improves the environment around one agent run, and Loop Engineering governs repeated agent work over time.
12
+
13
+ ## Longer Definition
14
+
15
+ Loop Engineering sits above prompt, context, and harness engineering. It turns agent work from turn-by-turn human prompting into a reviewable operating contract: what starts the loop, where work comes from, which agents act, what context and tools they receive, how results are verified, what state survives, when retry is allowed, and when a human takes over.
16
+
17
+ ## Minimal Loop Test
18
+
19
+ A system is probably practicing Loop Engineering when it can answer:
20
+
21
+ 1. What triggers the loop?
22
+ 1. How does it discover or receive work?
23
+ 1. What context and tools does it give the agent?
24
+ 1. What is the workspace and permission boundary?
25
+ 1. What verifies success or failure?
26
+ 1. What state persists across runs?
27
+ 1. What budget limits retries, time, or cost?
28
+ 1. What causes escalation?
29
+ 1. What condition ends the loop?
30
+
31
+ ## Citation Note
32
+
33
+ If you cite this repository, use the BibTeX entry in [`README.md`](README.md#citation) or [`CITATION.bib`](CITATION.bib). If you quote the concept definition, prefer linking to this page so readers can see the scope boundary.
LICENSE ADDED
@@ -0,0 +1,121 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Creative Commons Legal Code
2
+
3
+ CC0 1.0 Universal
4
+
5
+ CREATIVE COMMONS CORPORATION IS NOT A LAW FIRM AND DOES NOT PROVIDE
6
+ LEGAL SERVICES. DISTRIBUTION OF THIS DOCUMENT DOES NOT CREATE AN
7
+ ATTORNEY-CLIENT RELATIONSHIP. CREATIVE COMMONS PROVIDES THIS
8
+ INFORMATION ON AN "AS-IS" BASIS. CREATIVE COMMONS MAKES NO WARRANTIES
9
+ REGARDING THE USE OF THIS DOCUMENT OR THE INFORMATION OR WORKS
10
+ PROVIDED HEREUNDER, AND DISCLAIMS LIABILITY FOR DAMAGES RESULTING FROM
11
+ THE USE OF THIS DOCUMENT OR THE INFORMATION OR WORKS PROVIDED
12
+ HEREUNDER.
13
+
14
+ Statement of Purpose
15
+
16
+ The laws of most jurisdictions throughout the world automatically confer
17
+ exclusive Copyright and Related Rights (defined below) upon the creator
18
+ and subsequent owner(s) (each and all, an "owner") of an original work of
19
+ authorship and/or a database (each, a "Work").
20
+
21
+ Certain owners wish to permanently relinquish those rights to a Work for
22
+ the purpose of contributing to a commons of creative, cultural and
23
+ scientific works ("Commons") that the public can reliably and without fear
24
+ of later claims of infringement build upon, modify, incorporate in other
25
+ works, reuse and redistribute as freely as possible in any form whatsoever
26
+ and for any purposes, including without limitation commercial purposes.
27
+ These owners may contribute to the Commons to promote the ideal of a free
28
+ culture and the further production of creative, cultural and scientific
29
+ works, or to gain reputation or greater distribution for their Work in
30
+ part through the use and efforts of others.
31
+
32
+ For these and/or other purposes and motivations, and without any
33
+ expectation of additional consideration or compensation, the person
34
+ associating CC0 with a Work (the "Affirmer"), to the extent that he or she
35
+ is an owner of Copyright and Related Rights in the Work, voluntarily
36
+ elects to apply CC0 to the Work and publicly distribute the Work under its
37
+ terms, with knowledge of his or her Copyright and Related Rights in the
38
+ Work and the meaning and intended legal effect of CC0 on those rights.
39
+
40
+ 1. Copyright and Related Rights. A Work made available under CC0 may be
41
+ protected by copyright and related or neighboring rights ("Copyright and
42
+ Related Rights"). Copyright and Related Rights include, but are not
43
+ limited to, the following:
44
+
45
+ i. the right to reproduce, adapt, distribute, perform, display,
46
+ communicate, and translate a Work;
47
+ ii. moral rights retained by the original author(s) and/or performer(s);
48
+ iii. publicity and privacy rights pertaining to a person's image or
49
+ likeness depicted in a Work;
50
+ iv. rights protecting against unfair competition in regards to a Work,
51
+ subject to the limitations in paragraph 4(a), below;
52
+ v. rights protecting the extraction, dissemination, use and reuse of data
53
+ in a Work;
54
+ vi. database rights (such as those arising under Directive 96/9/EC of the
55
+ European Parliament and of the Council of 11 March 1996 on the legal
56
+ protection of databases, and under any national implementation
57
+ thereof, including any amended or successor version of such
58
+ directive); and
59
+ vii. other similar, equivalent or corresponding rights throughout the
60
+ world based on applicable law or treaty, and any national
61
+ implementations thereof.
62
+
63
+ 2. Waiver. To the greatest extent permitted by, but not in contravention
64
+ of, applicable law, Affirmer hereby overtly, fully, permanently,
65
+ irrevocably and unconditionally waives, abandons, and surrenders all of
66
+ Affirmer's Copyright and Related Rights and associated claims and causes
67
+ of action, whether now known or unknown (including existing as well as
68
+ future claims and causes of action), in the Work (i) in all territories
69
+ worldwide, (ii) for the maximum duration provided by applicable law or
70
+ treaty (including future time extensions), (iii) in any current or future
71
+ medium and for any number of copies, and (iv) for any purpose whatsoever,
72
+ including without limitation commercial, advertising or promotional
73
+ purposes (the "Waiver"). Affirmer makes the Waiver for the benefit of each
74
+ member of the public at large and to the detriment of Affirmer's heirs and
75
+ successors, fully intending that such Waiver shall not be subject to
76
+ revocation, rescission, cancellation, termination, or any other legal or
77
+ equitable action to disrupt the quiet enjoyment of the Work by the public
78
+ as contemplated by Affirmer's express Statement of Purpose.
79
+
80
+ 3. Public License Fallback. Should any part of the Waiver for any reason
81
+ be judged legally invalid or ineffective under applicable law, then the
82
+ Waiver shall be preserved to the maximum extent permitted taking into
83
+ account Affirmer's express Statement of Purpose. In addition, to the
84
+ extent the Waiver is so judged Affirmer hereby grants to each affected
85
+ person a royalty-free, non transferable, non sublicensable, non exclusive,
86
+ irrevocable and unconditional license to exercise Affirmer's Copyright and
87
+ Related Rights in the Work (i) in all territories worldwide, (ii) for the
88
+ maximum duration provided by applicable law or treaty (including future
89
+ time extensions), (iii) in any current or future medium and for any number
90
+ of copies, and (iv) for any purpose whatsoever, including without
91
+ limitation commercial, advertising or promotional purposes (the
92
+ "License"). The License shall be deemed effective as of the date CC0 was
93
+ applied by Affirmer to the Work. Should any part of the License for any
94
+ reason be judged legally invalid or ineffective under applicable law, such
95
+ partial invalidity or ineffectiveness shall not invalidate the remainder
96
+ of the License, and in such case Affirmer hereby affirms that he or she
97
+ will not (i) exercise any of his or her remaining Copyright and Related
98
+ Rights in the Work or (ii) assert any associated claims and causes of
99
+ action with respect to the Work, in either case contrary to Affirmer's
100
+ express Statement of Purpose.
101
+
102
+ 4. Limitations and Disclaimers.
103
+
104
+ a. No trademark or patent rights held by Affirmer are waived, abandoned,
105
+ surrendered, licensed or otherwise affected by this document.
106
+ b. Affirmer offers the Work as-is and makes no representations or
107
+ warranties of any kind concerning the Work, express, implied,
108
+ statutory or otherwise, including without limitation warranties of
109
+ title, merchantability, fitness for a particular purpose, non
110
+ infringement, or the absence of latent or other defects, accuracy, or
111
+ the present or absence of errors, whether or not discoverable, all to
112
+ the greatest extent permissible under applicable law.
113
+ c. Affirmer disclaims responsibility for clearing rights of other persons
114
+ that may apply to the Work or any use thereof, including without
115
+ limitation any person's Copyright and Related Rights in the Work.
116
+ Further, Affirmer disclaims responsibility for obtaining any necessary
117
+ consents, permissions or other rights required for any use of the
118
+ Work.
119
+ d. Affirmer understands and acknowledges that Creative Commons is not a
120
+ party to this document and has no duty or obligation with respect to
121
+ this CC0 or use of the Work.
MAINTAINER_PICKS.md ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Maintainer Picks
2
+
3
+ Start here if you want a compact path through the repository.
4
+
5
+ ## Concept
6
+
7
+ - [Loop Engineering](https://addyosmani.com/blog/loop-engineering/) - Direct framing of Loop Engineering as the layer above manual prompting and one floor above harness engineering.
8
+ - [Canonical Definition](DEFINITION.md) - Stable definition and scope test for quoting or explaining the concept.
9
+ - [Loop Engineering Manifesto](MANIFESTO.md) - Short statement of principles, non-goals, and success criteria.
10
+
11
+ ## Practice
12
+
13
+ - [Run long horizon tasks with Codex](https://developers.openai.com/blog/run-long-horizon-tasks-with-codex) - Practical plan-edit-test-observe-repair-document-repeat runbook.
14
+ - [Run prompts on a schedule](https://code.claude.com/docs/en/scheduled-tasks) - Scheduled loop mechanics for recurring prompts, monitors, reminders, and `/loop`.
15
+ - [PR babysitter pattern](patterns/pr-babysitter.md) - Concrete operational pattern for PR comments, CI, conflicts, and merge readiness.
16
+ - [CI repair loop pattern](patterns/ci-repair-loop.md) - Concrete operational pattern for turning failing checks into narrow verified patches.
17
+
18
+ ## Reliability
19
+
20
+ - [Stop Babysitting Your Coding Agent. Give It Backpressure.](https://generativeprogrammer.com/p/stop-babysitting-your-coding-agent) - Turns tests, linters, builds, traces, and other signals into feedback loops.
21
+ - [Building effective agents](https://www.anthropic.com/engineering/building-effective-agents) - Canonical workflow patterns and caution against unnecessary complexity.
22
+ - [Loop Engineering Anti-Patterns](ANTI-PATTERNS.md) - Failure modes to avoid before running agents repeatedly.
23
+
24
+ ## Reusable Artifacts
25
+
26
+ - [Loop contract schema](schemas/loop-contract.schema.json) - Machine-readable contract for recurring agent loops.
27
+ - [Example loop specs](examples/README.md) - Validated PR babysitter, CI repair, and docs drift loop examples.
28
+ - [Loop Gallery](gallery/README.md) - Community format for sharing real or anonymized loop examples.
MANIFESTO.md ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Loop Engineering Manifesto
2
+
3
+ Loop Engineering is the practice of designing recurring AI-agent systems that sit above prompt, context, and harness engineering.
4
+
5
+ Prompt engineering improves what you ask the model. Context engineering improves what the model can see. Harness engineering improves the tools, permissions, sandboxes, and checks around one agent run. Loop Engineering connects those layers over time: it defines when agents run, what work they discover, how work is delegated, how results are verified, what state survives, and when the system repeats, reports, or escalates.
6
+
7
+ ## Why It Exists
8
+
9
+ The leverage point in agent work is moving from writing better one-off prompts to designing better recurring systems. A useful loop can notice work, load the right context, act in an isolated workspace, verify against explicit gates, record receipts, and continue later without relying on a human to remember every intermediate step.
10
+
11
+ This does not remove engineering judgment. It moves judgment into the loop contract: objective, trigger, intake, workspace, context, delegation, verification, state, budget, escalation, and exit.
12
+
13
+ ## Core Commitments
14
+
15
+ - **Design the system, not just the next prompt.** The human should specify the operating contract, not manually steer every turn.
16
+ - **Make state external.** Progress files, issue comments, traces, checkpoints, and dashboards should outlive the model context.
17
+ - **Separate maker from checker.** The system that acts should not be the only system that decides whether the work is done.
18
+ - **Prefer deterministic gates.** Tests, typechecks, evals, dashboards, trace graders, and reviewer decisions are stronger than "looks good".
19
+ - **Bound autonomy.** Loops need budgets, allowed actions, disallowed actions, stop conditions, and escalation paths.
20
+ - **Keep receipts.** A loop should explain what it saw, what it changed, what it ran, what passed, what failed, and why it stopped.
21
+ - **Stay responsible.** A loop can delegate work, but ownership of quality, safety, and product judgment remains human.
22
+
23
+ ## What It Is Not
24
+
25
+ Loop Engineering is not a new name for every agent, cron job, workflow, or feedback system. It is not software event loops, growth loops, control theory, or generic automation. It is also not prompt engineering with repetition. A loop needs a trigger, work intake, durable state, verification, budget, and exit condition.
26
+
27
+ ## Success Standard
28
+
29
+ A Loop Engineering artifact is useful when another builder can answer:
30
+
31
+ 1. What starts the loop?
32
+ 1. How does it discover work?
33
+ 1. Which agent or role does what?
34
+ 1. What context and tools are available?
35
+ 1. What can it change safely?
36
+ 1. What verifies success or failure?
37
+ 1. What state is persisted for the next run?
38
+ 1. What is the retry budget?
39
+ 1. When does it escalate?
40
+ 1. When is it done?
41
+
42
+ If those answers are visible, the loop can be reviewed, shared, improved, and trusted.
QUOTES.md ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Sourced Signals And Quotes
2
+
3
+ This page records short sourced signals around the emerging Loop Engineering concept. It is not a substitute for the original sources. Use it to understand provenance, then read the linked material directly.
4
+
5
+ ## Addy Osmani
6
+
7
+ Source: [Loop Engineering](https://addyosmani.com/blog/loop-engineering/)
8
+
9
+ > "Loop engineering is replacing yourself as the person who prompts the agent. You design the system that does it instead."
10
+
11
+ Why it matters: This is a direct definition of the shift from manual prompting to designing the recurring system that prompts, checks, and continues.
12
+
13
+ The same article states:
14
+
15
+ > "Loop engineering sits one floor above the harness."
16
+
17
+ Why it matters: This anchors the repository's four-layer framing: prompt, context, and harness engineering improve agent runs; Loop Engineering governs repeated agent work over time.
18
+
19
+ ## Peter Steinberger
20
+
21
+ Source: Addy Osmani's [Loop Engineering](https://addyosmani.com/blog/loop-engineering/) article reports this statement from Peter Steinberger.
22
+
23
+ > "You shouldn’t be prompting coding agents anymore. You should be designing loops that prompt your agents."
24
+
25
+ Why it matters: This is one of the clearest formulations of the human role moving from turn-by-turn prompting to loop design.
26
+
27
+ ## Boris Cherny
28
+
29
+ Source: [I Now Just Write Loops To Prompt Claude Code: Claude Code Creator Boris Cherny](https://officechai.com/ai/i-now-just-write-loops-to-prompt-claude-code-claude-code-creator-boris-cherny/)
30
+
31
+ > "Now it’s actually leveled up, I think, again, to the next wave of abstraction where I don’t prompt Claude anymore. I have loops that are running. They’re the ones that are prompting Claude and figuring out what to do. My job is to write loops."
32
+
33
+ Why it matters: This is the practical workflow claim behind the concept: the developer designs the system that prompts, evaluates, and decides what to do next.
34
+
35
+ ## Anthropic
36
+
37
+ Source: [Building effective agents](https://www.anthropic.com/engineering/building-effective-agents)
38
+
39
+ > "Consistently, the most successful implementations use simple, composable patterns rather than complex frameworks."
40
+
41
+ Why it matters: Loop Engineering should stay contract-driven and composable. The goal is not to add complexity for its own sake.
42
+
43
+ The same article also states:
44
+
45
+ > "When building applications with LLMs, we recommend finding the simplest solution possible, and only increasing complexity when needed."
46
+
47
+ Why it matters: This supports a conservative maturity path: start with explicit state and verification before adding multi-agent orchestration or production autonomy.
README.de.md ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Awesome Loop Engineering
2
+
3
+ <!-- last-synced: 2026-06-11 -->
4
+
5
+ <p align="center">
6
+ <img src="assets/awesome-loop-engineering-cover.png" alt="Awesome Loop Engineering cover" width="100%">
7
+ </p>
8
+
9
+ <p align="center">
10
+ <a href="README.md">English</a> |
11
+ <a href="README.zh-CN.md">中文</a> |
12
+ <a href="README.es.md">Español</a> |
13
+ <a href="README.fr.md">Français</a> |
14
+ <a href="README.de.md">Deutsch</a> |
15
+ <a href="README.ja.md">日本語</a> |
16
+ <a href="README.ko.md">한국어</a> |
17
+ <a href="README.pt-BR.md">Português</a> |
18
+ <a href="TRANSLATIONS.md">Beim Übersetzen helfen</a>
19
+ </p>
20
+
21
+ > Eine kuratierte, umsetzungsorientierte Liste für **Loop Engineering**: die Ebene oberhalb von Prompt Engineering, Context Engineering und Harness Engineering zum Entwerfen wiederkehrender KI-Agenten-Systeme.
22
+
23
+ Prompt Engineering verbessert, was man dem Modell sagt. Context Engineering verbessert, was das Modell sehen kann. Harness Engineering verbessert Werkzeuge, Berechtigungen, Sandboxes und Prüfungen rund um einen einzelnen Agentenlauf. **Loop Engineering liegt über allen drei Ebenen**: Es entwirft Systeme, die Agenten auslösen, überwachen, Ergebnisse prüfen, Zustand speichern und erneut laufen.
24
+
25
+ Ein Loop entdeckt Arbeit, übergibt sie an einen oder mehrere Agenten, prüft das Ergebnis, speichert Zustand, entscheidet den nächsten Schritt und läuft erneut nach Zeitplan oder bis ein überprüfbares Ziel erreicht ist.
26
+
27
+ Dieses Repository behandelt die neue Bedeutung von Loop Engineering im Kontext von KI-Agenten und Coding Agents. Es geht nicht um Software-Event-Loops, Regelungstechnik, Growth Loops, generische Automatisierung oder nicht-KI-bezogene Feedback-Loops.
28
+
29
+ ## Mentales Modell
30
+
31
+ - Prompt Engineering fragt: Was soll ich dem Modell sagen?
32
+ - Context Engineering fragt: Welchen Zustand und welches Wissen soll das Modell sehen?
33
+ - Harness Engineering fragt: Welche Werkzeuge, Berechtigungen, Tests, Sandboxes und Feedback-Signale sollen den Agenten umgeben?
34
+ - Loop Engineering fragt: Welches wiederkehrende System soll Arbeit entdecken, an Agenten delegieren, Ergebnisse prüfen, Zustand speichern, nächste Aktionen entscheiden und erneut laufen?
35
+
36
+ Prompt, Context und Harness Engineering verbessern einen einzelnen Lauf. Loop Engineering macht Agentenarbeit über Zeit wiederholbar, beobachtbar und steuerbar.
37
+
38
+ ## Loop Contract
39
+
40
+ Ein nützlicher Loop macht normalerweise diese Bestandteile sichtbar:
41
+
42
+ | Teil | Designfrage | Typisches Artefakt |
43
+ | ----------------- | ------------------------------------------------ | ----------------------------------------------------------- |
44
+ | Objective | Was soll der Loop optimieren? | Goal, issue, PRD, runbook |
45
+ | Trigger | Wann läuft der Loop? | Schedule, webhook, `/loop`, `/goal`, automation |
46
+ | Discover / Intake | Wie findet der Loop Arbeit? | GitHub query, Linear filter, CI failure, feedback stream |
47
+ | Workspace | Wo kann der Agent sicher handeln? | Worktree, sandbox, branch, container |
48
+ | Context | Welches dauerhafte Wissen wird geladen? | `AGENTS.md`, `CLAUDE.md`, `SKILL.md`, docs |
49
+ | Delegation | Welcher Agent übernimmt welche Aufgabe? | Explorer, implementer, reviewer, judge |
50
+ | Verification | Was entscheidet über Erfolg oder Fehler? | Tests, typecheck, lint, evals, trace graders |
51
+ | State | Was bleibt für den nächsten Lauf erhalten? | Progress file, checkpoint, trace, issue comment |
52
+ | Budget | Wann soll der Loop aufhören zu verbrauchen? | Max turns, max retries, token budget, time box |
53
+ | Escalation | Wann übernimmt ein Mensch? | PR, issue, Slack alert, triage inbox |
54
+ | Exit | Woher weiß der Loop, dass er fertig ist? | Acceptance criteria, passing checks, no work found |
55
+
56
+ ## Reifegradmodell
57
+
58
+ | Stufe | Name | Beschreibung |
59
+ | ----- | -------------------------- | --------------------------------------------------------------------------------------------- |
60
+ | 0 | Manual prompting | Ein Mensch liest den Zustand und schreibt den nächsten Prompt. |
61
+ | 1 | Scripted retry | Ein Skript gibt Fehler an den Agenten zurück. |
62
+ | 2 | Scheduled loop | Der Agent läuft nach Zeitplan und berichtet Ergebnisse. |
63
+ | 3 | Stateful loop | Fortschritt bleibt über Dateien, Issues, Checkpoints oder Traces erhalten. |
64
+ | 4 | Self-verifying loop | Deterministische Checks oder Evaluator-Agenten blockieren falsche Abschlüsse. |
65
+ | 5 | Multi-agent loop | Spezialisierte Agenten teilen Discovery, Implementierung, Review und Urteil auf. |
66
+ | 6 | Production-supervised loop | Observability, Budgets, Freigaben, Rollback und menschliche Eskalation sind zentral. |
67
+
68
+ ## Erste Lektüre
69
+
70
+ Die vollständige Ressourcenliste bleibt im kanonischen englischen README: [README.md](README.md).
71
+
72
+ Empfohlene Einstiege:
73
+
74
+ - [Loop Engineering](https://addyosmani.com/blog/loop-engineering/) - Direkte Definition des Wechsels von manuellem Prompting zu Systemen, die prompten, prüfen und fortsetzen.
75
+ - [Run long horizon tasks with Codex](https://developers.openai.com/blog/run-long-horizon-tasks-with-codex) - Praktischer Leitfaden für plan-edit-test-observe-repair-document-repeat.
76
+ - [Run prompts on a schedule](https://code.claude.com/docs/en/scheduled-tasks) - Offizielle Mechanik für `/loop`, geplante Aufgaben und wiederkehrende Prompts.
77
+ - [Building Effective Agents](https://www.anthropic.com/engineering/building-effective-agents) - Komponierbare Patterns für Workflows und Agenten.
78
+
79
+ ## Beitragen
80
+
81
+ Beiträge sind willkommen. Bitte lies [CONTRIBUTING.md](CONTRIBUTING.md), bevor du einen Pull Request öffnest.
82
+
83
+ Schneller Ablauf:
84
+
85
+ 1. Prüfe, ob die Ressource Loop Engineering für KI-Agenten/Coding Agents oder eine direkte Grundlage dafür behandelt.
86
+ 1. Suche im README, um Duplikate zu vermeiden.
87
+ 1. Wähle die spezifischste Kategorie.
88
+ 1. Füge einen Eintrag in diesem Format hinzu:
89
+
90
+ ```md
91
+ - 📄 **Paper** [Title](https://example.com) - One sentence explaining the resource's contribution to Loop Engineering.
92
+ ```
93
+
94
+ 1. Erkläre im PR Relevanz, Kategorie, Ressourcentyp und Nutzen für Builders.
95
+
96
+ ## Übersetzungen
97
+
98
+ Wenn du eine Sprache pflegen oder hinzufügen möchtest, lies [TRANSLATIONS.md](TRANSLATIONS.md). Übersetzungen müssen den engen Scope bewahren und dürfen Event Loops, Growth Loops oder generische Automatisierung nicht in den Umfang ziehen.
README.es.md ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Awesome Loop Engineering
2
+
3
+ <!-- last-synced: 2026-06-11 -->
4
+
5
+ <p align="center">
6
+ <img src="assets/awesome-loop-engineering-cover.png" alt="Awesome Loop Engineering cover" width="100%">
7
+ </p>
8
+
9
+ <p align="center">
10
+ <a href="README.md">English</a> |
11
+ <a href="README.zh-CN.md">中文</a> |
12
+ <a href="README.es.md">Español</a> |
13
+ <a href="README.fr.md">Français</a> |
14
+ <a href="README.de.md">Deutsch</a> |
15
+ <a href="README.ja.md">日本語</a> |
16
+ <a href="README.ko.md">한국어</a> |
17
+ <a href="README.pt-BR.md">Português</a> |
18
+ <a href="TRANSLATIONS.md">Ayudar a traducir</a>
19
+ </p>
20
+
21
+ > Una lista curada y orientada a la implementación para **Loop Engineering**: la capa por encima de prompt, context y harness engineering para diseñar sistemas recurrentes de agentes de IA.
22
+
23
+ Prompt engineering mejora lo que le pides al modelo. Context engineering mejora lo que el modelo puede ver. Harness engineering mejora las herramientas, permisos, sandboxes y verificaciones alrededor de una ejecución de agente. **Loop Engineering está por encima de las tres**: diseña sistemas que activan agentes, los supervisan, verifican resultados, guardan estado y vuelven a ejecutarse.
24
+
25
+ Un loop descubre trabajo, lo delega a uno o más agentes, verifica el resultado, registra estado, decide la siguiente acción y vuelve a ejecutarse con una cadencia o hasta alcanzar un objetivo verificable.
26
+
27
+ Este repositorio se centra en el significado nuevo de Loop Engineering para agentes de IA y coding agents. No trata sobre event loops de software, teoría de control, growth loops, automatización genérica o feedback loops no relacionados con IA.
28
+
29
+ ## Modelo Mental
30
+
31
+ - Prompt engineering pregunta: ¿qué debería decirle al modelo?
32
+ - Context engineering pregunta: ¿qué estado y conocimiento debería ver el modelo?
33
+ - Harness engineering pregunta: ¿qué herramientas, permisos, pruebas, sandboxes y feedback deberían rodear al agente?
34
+ - Loop engineering pregunta: ¿qué sistema recurrente debería descubrir trabajo, delegarlo a agentes, verificar resultados, persistir estado, decidir siguientes acciones y volver a ejecutarse?
35
+
36
+ Prompt, context y harness engineering mejoran una ejecución. Loop Engineering hace que el trabajo de agentes sea repetible, observable y gobernable en el tiempo.
37
+
38
+ ## Loop Contract
39
+
40
+ Un loop útil normalmente necesita estas partes:
41
+
42
+ | Parte | Pregunta de diseño | Artefacto común |
43
+ | ----------------- | ------------------------------------------ | ----------------------------------------------------------- |
44
+ | Objective | ¿Qué debe optimizar el loop? | Goal, issue, PRD, runbook |
45
+ | Trigger | ¿Cuándo se ejecuta? | Schedule, webhook, `/loop`, `/goal`, automation |
46
+ | Discover / Intake | ¿Cómo encuentra trabajo? | GitHub query, Linear filter, CI failure, feedback stream |
47
+ | Workspace | ¿Dónde puede actuar el agente con cuidado? | Worktree, sandbox, branch, container |
48
+ | Context | ¿Qué conocimiento durable debe cargar? | `AGENTS.md`, `CLAUDE.md`, `SKILL.md`, docs |
49
+ | Delegation | ¿Qué agente hace cada parte? | Explorer, implementer, reviewer, judge |
50
+ | Verification | ¿Qué decide éxito o fallo? | Tests, typecheck, lint, evals, trace graders |
51
+ | State | ¿Qué sobrevive a la siguiente iteración? | Progress file, checkpoint, trace, issue comment |
52
+ | Budget | ¿Cuándo debe dejar de gastar? | Max turns, max retries, token budget, time box |
53
+ | Escalation | ¿Cuándo interviene una persona? | PR, issue, Slack alert, triage inbox |
54
+ | Exit | ¿Cómo sabe que terminó? | Acceptance criteria, passing checks, no work found |
55
+
56
+ ## Modelo de Madurez
57
+
58
+ | Nivel | Nombre | Descripción |
59
+ | ----- | -------------------------- | ----------------------------------------------------------------------------------------- |
60
+ | 0 | Manual prompting | Una persona lee el estado y escribe el siguiente prompt. |
61
+ | 1 | Scripted retry | Un script devuelve errores al agente. |
62
+ | 2 | Scheduled loop | El agente corre con una cadencia y reporta resultados. |
63
+ | 3 | Stateful loop | El progreso sobrevive mediante archivos, issues, checkpoints o traces. |
64
+ | 4 | Self-verifying loop | Verificaciones deterministas o evaluadores bloquean un cierre incorrecto. |
65
+ | 5 | Multi-agent loop | Agentes especializados dividen descubrimiento, implementación, revisión y juicio. |
66
+ | 6 | Production-supervised loop | Observabilidad, presupuestos, aprobaciones, rollback y escalación humana son centrales. |
67
+
68
+ ## Por Dónde Empezar
69
+
70
+ La lista completa de recursos vive en el README canónico en inglés: [README.md](README.md).
71
+
72
+ Recursos iniciales recomendados:
73
+
74
+ - [Loop Engineering](https://addyosmani.com/blog/loop-engineering/) - Definición directa del cambio desde prompting manual hacia sistemas que prompt, verifican y continúan.
75
+ - [Run long horizon tasks with Codex](https://developers.openai.com/blog/run-long-horizon-tasks-with-codex) - Guía práctica para ciclos plan-edit-test-observe-repair-document-repeat.
76
+ - [Run prompts on a schedule](https://code.claude.com/docs/en/scheduled-tasks) - Mecánica oficial para `/loop`, tareas programadas y prompts recurrentes.
77
+ - [Building Effective Agents](https://www.anthropic.com/engineering/building-effective-agents) - Patrones composables para workflows y agentes.
78
+
79
+ ## Contribuir
80
+
81
+ Las contribuciones son bienvenidas. Lee [CONTRIBUTING.md](CONTRIBUTING.md) antes de abrir un pull request.
82
+
83
+ Proceso rápido:
84
+
85
+ 1. Confirma que el recurso trata de Loop Engineering para agentes de IA/coding agents o de una base directa para ello.
86
+ 1. Busca en el README para evitar duplicados.
87
+ 1. Elige la categoría más específica.
88
+ 1. Añade una entrada con este formato:
89
+
90
+ ```md
91
+ - 📄 **Paper** [Title](https://example.com) - One sentence explaining the resource's contribution to Loop Engineering.
92
+ ```
93
+
94
+ 1. Explica en el PR la relevancia, la categoría, el tipo de recurso y por qué ayuda a builders.
95
+
96
+ ## Traducciones
97
+
98
+ Para mantener o añadir un idioma, lee [TRANSLATIONS.md](TRANSLATIONS.md). Las traducciones deben conservar el alcance estrecho: no mezclar event loops, growth loops ni automatización genérica.
README.fr.md ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Awesome Loop Engineering
2
+
3
+ <!-- last-synced: 2026-06-11 -->
4
+
5
+ <p align="center">
6
+ <img src="assets/awesome-loop-engineering-cover.png" alt="Awesome Loop Engineering cover" width="100%">
7
+ </p>
8
+
9
+ <p align="center">
10
+ <a href="README.md">English</a> |
11
+ <a href="README.zh-CN.md">中文</a> |
12
+ <a href="README.es.md">Español</a> |
13
+ <a href="README.fr.md">Français</a> |
14
+ <a href="README.de.md">Deutsch</a> |
15
+ <a href="README.ja.md">日本語</a> |
16
+ <a href="README.ko.md">한국어</a> |
17
+ <a href="README.pt-BR.md">Português</a> |
18
+ <a href="TRANSLATIONS.md">Aider à traduire</a>
19
+ </p>
20
+
21
+ > Une liste organisée et orientée implémentation pour **Loop Engineering** : la couche au-dessus du prompt engineering, du context engineering et du harness engineering pour concevoir des systèmes récurrents d'agents IA.
22
+
23
+ Le prompt engineering améliore ce que l'on demande au modèle. Le context engineering améliore ce que le modèle peut voir. Le harness engineering améliore les outils, permissions, sandboxes et vérifications autour d'une exécution d'agent. **Loop Engineering se situe au-dessus des trois** : il conçoit des systèmes qui déclenchent des agents, les supervisent, vérifient les résultats, persistent l'état et relancent le travail.
24
+
25
+ Un loop découvre du travail, le délègue à un ou plusieurs agents, vérifie le résultat, enregistre l'état, décide de l'action suivante et se relance selon une cadence ou jusqu'à atteindre un objectif vérifiable.
26
+
27
+ Ce dépôt concerne le nouveau sens de Loop Engineering dans le contexte des agents IA et coding agents. Il ne concerne pas les event loops logiciels, la théorie du contrôle, les growth loops, l'automatisation générique ou les feedback loops non liés à l'IA.
28
+
29
+ ## Modèle Mental
30
+
31
+ - Prompt engineering demande : que faut-il dire au modèle ?
32
+ - Context engineering demande : quel état et quelles connaissances le modèle doit-il voir ?
33
+ - Harness engineering demande : quels outils, permissions, tests, sandboxes et signaux de feedback doivent entourer l'agent ?
34
+ - Loop engineering demande : quel système récurrent doit découvrir le travail, déléguer aux agents, vérifier les résultats, persister l'état, décider des prochaines actions et se relancer ?
35
+
36
+ Prompt, context et harness engineering améliorent une exécution. Loop Engineering rend le travail des agents répétable, observable et gouvernable dans le temps.
37
+
38
+ ## Loop Contract
39
+
40
+ Un loop utile rend généralement visibles ces éléments :
41
+
42
+ | Élément | Question de conception | Artefact courant |
43
+ | ----------------- | -------------------------------------------- | ----------------------------------------------------------- |
44
+ | Objective | Que doit optimiser le loop ? | Goal, issue, PRD, runbook |
45
+ | Trigger | Quand le loop s'exécute-t-il ? | Schedule, webhook, `/loop`, `/goal`, automation |
46
+ | Discover / Intake | Comment le loop trouve-t-il le travail ? | GitHub query, Linear filter, CI failure, feedback stream |
47
+ | Workspace | Où l'agent peut-il agir en sécurité ? | Worktree, sandbox, branch, container |
48
+ | Context | Quelles connaissances durables charger ? | `AGENTS.md`, `CLAUDE.md`, `SKILL.md`, docs |
49
+ | Delegation | Quel agent fait quoi ? | Explorer, implementer, reviewer, judge |
50
+ | Verification | Qu'est-ce qui décide succès ou échec ? | Tests, typecheck, lint, evals, trace graders |
51
+ | State | Qu'est-ce qui survit au prochain passage ? | Progress file, checkpoint, trace, issue comment |
52
+ | Budget | Quand faut-il arrêter de consommer ? | Max turns, max retries, token budget, time box |
53
+ | Escalation | Quand une personne doit-elle reprendre ? | PR, issue, Slack alert, triage inbox |
54
+ | Exit | Comment sait-on que le loop est terminé ? | Acceptance criteria, passing checks, no work found |
55
+
56
+ ## Modèle de Maturité
57
+
58
+ | Niveau | Nom | Description |
59
+ | ------ | -------------------------- | ------------------------------------------------------------------------------------------- |
60
+ | 0 | Manual prompting | Une personne lit l'état et écrit le prompt suivant. |
61
+ | 1 | Scripted retry | Un script renvoie les erreurs à l'agent. |
62
+ | 2 | Scheduled loop | L'agent s'exécute selon une cadence et rapporte ses résultats. |
63
+ | 3 | Stateful loop | Le progrès survit via fichiers, issues, checkpoints ou traces. |
64
+ | 4 | Self-verifying loop | Des vérifications déterministes ou évaluateurs empêchent une fausse validation. |
65
+ | 5 | Multi-agent loop | Des agents spécialisés séparent découverte, implémentation, revue et jugement. |
66
+ | 6 | Production-supervised loop | Observabilité, budgets, approbations, rollback et escalade humaine sont de premier ordre. |
67
+
68
+ ## Premières Lectures
69
+
70
+ La liste complète des ressources reste dans le README canonique en anglais : [README.md](README.md).
71
+
72
+ Ressources recommandées pour commencer :
73
+
74
+ - [Loop Engineering](https://addyosmani.com/blog/loop-engineering/) - Définition directe du passage du prompting manuel à des systèmes qui promptent, vérifient et continuent.
75
+ - [Run long horizon tasks with Codex](https://developers.openai.com/blog/run-long-horizon-tasks-with-codex) - Guide pratique pour des cycles plan-edit-test-observe-repair-document-repeat.
76
+ - [Run prompts on a schedule](https://code.claude.com/docs/en/scheduled-tasks) - Mécanismes officiels pour `/loop`, tâches planifiées et prompts récurrents.
77
+ - [Building Effective Agents](https://www.anthropic.com/engineering/building-effective-agents) - Patterns composables pour workflows et agents.
78
+
79
+ ## Contribuer
80
+
81
+ Les contributions sont bienvenues. Lis [CONTRIBUTING.md](CONTRIBUTING.md) avant d'ouvrir une pull request.
82
+
83
+ Processus rapide :
84
+
85
+ 1. Vérifie que la ressource concerne Loop Engineering pour agents IA/coding agents ou une base directe.
86
+ 1. Recherche dans le README pour éviter les doublons.
87
+ 1. Choisis la catégorie la plus spécifique.
88
+ 1. Ajoute une entrée dans ce format :
89
+
90
+ ```md
91
+ - 📄 **Paper** [Title](https://example.com) - One sentence explaining the resource's contribution to Loop Engineering.
92
+ ```
93
+
94
+ 1. Explique dans la PR la pertinence, la catégorie, le type de ressource et l'intérêt pour les builders.
95
+
96
+ ## Traductions
97
+
98
+ Pour maintenir ou ajouter une langue, lis [TRANSLATIONS.md](TRANSLATIONS.md). Les traductions doivent préserver le périmètre : ne pas inclure les event loops, growth loops ou automatisations génériques.
README.ja.md ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Awesome Loop Engineering
2
+
3
+ <!-- last-synced: 2026-06-11 -->
4
+
5
+ <p align="center">
6
+ <img src="assets/awesome-loop-engineering-cover.png" alt="Awesome Loop Engineering cover" width="100%">
7
+ </p>
8
+
9
+ <p align="center">
10
+ <a href="README.md">English</a> |
11
+ <a href="README.zh-CN.md">中文</a> |
12
+ <a href="README.es.md">Español</a> |
13
+ <a href="README.fr.md">Français</a> |
14
+ <a href="README.de.md">Deutsch</a> |
15
+ <a href="README.ja.md">日本語</a> |
16
+ <a href="README.ko.md">한국어</a> |
17
+ <a href="README.pt-BR.md">Português</a> |
18
+ <a href="TRANSLATIONS.md">翻訳に協力する</a>
19
+ </p>
20
+
21
+ > **Loop Engineering** のための、実装志向のキュレーションリストです。Loop Engineering は prompt、context、harness engineering の上位レイヤーとして、繰り返し実行される AI-agent システムを設計します。
22
+
23
+ Prompt engineering はモデルに何を依頼するかを改善します。Context engineering はモデルが何を見られるかを改善します。Harness engineering は 1 回の agent 実行を取り巻くツール、権限、sandbox、検証を改善します。**Loop Engineering はその上位にあります**。agent を起動し、監督し、結果を検証し、状態を保存し、再実行するシステムを設計する実践です。
24
+
25
+ Loop は作業を発見し、1 つ以上の agents に委任し、結果を確認し、状態を記録し、次の行動を決め、一定の cadence または検証可能な目標に到達するまで再実行されます。
26
+
27
+ このリポジトリは AI agents / coding agents における新しい意味の Loop Engineering に限定しています。software event loop、制御理論、growth loop、一般的な workflow automation、非 AI の feedback loop は対象外です。
28
+
29
+ ## メンタルモデル
30
+
31
+ - Prompt engineering: モデルに何を言うべきか?
32
+ - Context engineering: モデルはどの状態や知識を見るべきか?
33
+ - Harness engineering: agent の周囲にどのツール、権限、テスト、sandbox、feedback を置くべきか?
34
+ - Loop engineering: 人間が内側のループから離れたとき、どの反復システムが作業を発見し、agent に委任し、結果を検証し、状態を永続化し、次の行動を決め、再実行するべきか?
35
+
36
+ Prompt、context、harness engineering は 1 回の実行を良くします。Loop Engineering は agent の仕事を時間をまたいで反復可能、観測可能、統治可能にします。
37
+
38
+ ## Loop Contract
39
+
40
+ 有用な loop には通常、次の要素が必要です。
41
+
42
+ | 要素 | 設計上の問い | 一般的な成果物 |
43
+ | ----------------- | --------------------------------------------- | ----------------------------------------------------------- |
44
+ | Objective | loop は何を最適化するのか? | Goal, issue, PRD, runbook |
45
+ | Trigger | いつ実行されるのか? | Schedule, webhook, `/loop`, `/goal`, automation |
46
+ | Discover / Intake | どのように作業を発見するのか? | GitHub query, Linear filter, CI failure, feedback stream |
47
+ | Workspace | agent はどこで安全に行動できるのか? | Worktree, sandbox, branch, container |
48
+ | Context | どの永続的な知識を読み込むのか? | `AGENTS.md`, `CLAUDE.md`, `SKILL.md`, docs |
49
+ | Delegation | どの agent が何を担当するのか? | Explorer, implementer, reviewer, judge |
50
+ | Verification | 何が成功または失敗を判断するのか? | Tests, typecheck, lint, evals, trace graders |
51
+ | State | 次回の実行に何を残すのか? | Progress file, checkpoint, trace, issue comment |
52
+ | Budget | いつ消費を止めるのか? | Max turns, max retries, token budget, time box |
53
+ | Escalation | いつ人間に引き継ぐのか? | PR, issue, Slack alert, triage inbox |
54
+ | Exit | loop はどう完了を判断するのか? | Acceptance criteria, passing checks, no work found |
55
+
56
+ ## 成熟度モデル
57
+
58
+ | レベル | 名称 | 説明 |
59
+ | ------ | -------------------------- | -------------------------------------------------------------------------------------------- |
60
+ | 0 | Manual prompting | 人間が状態を読み、次の prompt を書く。 |
61
+ | 1 | Scripted retry | script がエラーを agent に戻す。 |
62
+ | 2 | Scheduled loop | agent が一定の cadence で実行され、結果を報告する。 |
63
+ | 3 | Stateful loop | ファイル、issue、checkpoint、trace によって進捗が残る。 |
64
+ | 4 | Self-verifying loop | 決定的な check や evaluator agent が誤った完了を防ぐ。 |
65
+ | 5 | Multi-agent loop | 専門 agents が discovery、implementation、review、judgment を分担する。 |
66
+ | 6 | Production-supervised loop | observability、budget、approval、rollback、人間への escalation が一級の要素になる。 |
67
+
68
+ ## はじめに読むもの
69
+
70
+ 完全なリソース一覧は英語の canonical README にあります: [README.md](README.md)。
71
+
72
+ おすすめの入口:
73
+
74
+ - [Loop Engineering](https://addyosmani.com/blog/loop-engineering/) - 手動 prompt から、prompt・検証・継続を行うシステム設計への移行を定義します。
75
+ - [Run long horizon tasks with Codex](https://developers.openai.com/blog/run-long-horizon-tasks-with-codex) - plan-edit-test-observe-repair-document-repeat の実践的な runbook。
76
+ - [Run prompts on a schedule](https://code.claude.com/docs/en/scheduled-tasks) - `/loop`、scheduled tasks、recurring prompts の公式メカニクス。
77
+ - [Building Effective Agents](https://www.anthropic.com/engineering/building-effective-agents) - workflow と agents の composable patterns。
78
+
79
+ ## 貢献
80
+
81
+ Pull request は歓迎です。まず [CONTRIBUTING.md](CONTRIBUTING.md) を読んでください。
82
+
83
+ 最短手順:
84
+
85
+ 1. そのリソースが AI/coding-agent 文脈の Loop Engineering、またはその直接的な基盤であることを確認する。
86
+ 1. README を検索して重複を避ける。
87
+ 1. 最も具体的なカテゴリを選ぶ。
88
+ 1. 次の形式で 1 行追加する。
89
+
90
+ ```md
91
+ - 📄 **Paper** [Title](https://example.com) - One sentence explaining the resource's contribution to Loop Engineering.
92
+ ```
93
+
94
+ 1. PR で関連性、カテゴリ、リソース種別、builders にとっての価値を説明する。
95
+
96
+ ## 翻訳
97
+
98
+ 新しい言語を追加または維持したい場合は [TRANSLATIONS.md](TRANSLATIONS.md) を読んでください。翻訳では scope boundary を守り、event loop、growth loop、一般的な automation を混ぜないでください。
README.ko.md ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Awesome Loop Engineering
2
+
3
+ <!-- last-synced: 2026-06-11 -->
4
+
5
+ <p align="center">
6
+ <img src="assets/awesome-loop-engineering-cover.png" alt="Awesome Loop Engineering cover" width="100%">
7
+ </p>
8
+
9
+ <p align="center">
10
+ <a href="README.md">English</a> |
11
+ <a href="README.zh-CN.md">中文</a> |
12
+ <a href="README.es.md">Español</a> |
13
+ <a href="README.fr.md">Français</a> |
14
+ <a href="README.de.md">Deutsch</a> |
15
+ <a href="README.ja.md">日本語</a> |
16
+ <a href="README.ko.md">한국어</a> |
17
+ <a href="README.pt-BR.md">Português</a> |
18
+ <a href="TRANSLATIONS.md">번역 돕기</a>
19
+ </p>
20
+
21
+ > **Loop Engineering** 을 위한 구현 중심 큐레이션 목록입니다. Loop Engineering 은 prompt, context, harness engineering 위의 레이어로, 반복 실행되는 AI-agent 시스템을 설계합니다.
22
+
23
+ Prompt engineering 은 모델에게 무엇을 요청할지 개선합니다. Context engineering 은 모델이 무엇을 볼 수 있는지 개선합니다. Harness engineering 은 한 번의 agent 실행을 둘러싼 도구, 권한, sandbox, 검증을 개선합니다. **Loop Engineering 은 이 세 레이어 위에 있습니다**. agent 를 실행하고, 감독하고, 결과를 검증하고, 상태를 저장하고, 다시 실행하는 시스템을 설계하는 실천입니다.
24
+
25
+ Loop 는 작업을 발견하고, 하나 이상의 agents 에게 위임하고, 결과를 확인하고, 상태를 기록하고, 다음 행동을 결정한 뒤, 일정 cadence 또는 검증 가능한 목표에 도달할 때까지 다시 실행됩니다.
26
+
27
+ 이 저장소는 AI agents / coding agents 맥락의 새로운 Loop Engineering 의미에만 집중합니다. software event loop, control theory, growth loop, 일반적인 workflow automation, 비 AI feedback loop 는 범위에 포함하지 않습니다.
28
+
29
+ ## 멘탈 모델
30
+
31
+ - Prompt engineering: 모델에게 무엇을 말해야 하는가?
32
+ - Context engineering: 모델이 어떤 상태와 지식을 봐야 하는가?
33
+ - Harness engineering: agent 주변에 어떤 도구, 권한, 테스트, sandbox, feedback 이 있어야 하는가?
34
+ - Loop engineering: 사람이 내부 루프에 있지 않을 때 어떤 반복 시스템이 작업을 발견하고, agents 에게 위임하고, 결과를 검증하고, 상태를 저장하고, 다음 행동을 결정하고, 다시 실행해야 하는가?
35
+
36
+ Prompt, context, harness engineering 은 한 번의 실행을 더 좋게 만듭니다. Loop Engineering 은 agent 작업을 시간에 걸쳐 반복 가능하고, 관찰 가능하고, 거버넌스 가능하게 만듭니다.
37
+
38
+ ## Loop Contract
39
+
40
+ 유용한 loop 는 보통 다음 요소를 명확히 해야 합니다.
41
+
42
+ | 요소 | 설계 질문 | 일반적인 산출물 |
43
+ | ----------------- | ---------------------------------------------- | ----------------------------------------------------------- |
44
+ | Objective | loop 는 무엇을 최적화하는가? | Goal, issue, PRD, runbook |
45
+ | Trigger | 언제 실행되는가? | Schedule, webhook, `/loop`, `/goal`, automation |
46
+ | Discover / Intake | 어떻게 작업을 발견하는가? | GitHub query, Linear filter, CI failure, feedback stream |
47
+ | Workspace | agent 는 어디에서 안전하게 행동하는가? | Worktree, sandbox, branch, container |
48
+ | Context | 어떤 지속 지식을 로드해야 하는가? | `AGENTS.md`, `CLAUDE.md`, `SKILL.md`, docs |
49
+ | Delegation | 어떤 agent 가 무엇을 담당하는가? | Explorer, implementer, reviewer, judge |
50
+ | Verification | 무엇이 성공 또는 실패를 판단하는가? | Tests, typecheck, lint, evals, trace graders |
51
+ | State | 다음 실행까지 무엇이 남아야 하는가? | Progress file, checkpoint, trace, issue comment |
52
+ | Budget | 언제 비용 소비를 멈춰야 하는가? | Max turns, max retries, token budget, time box |
53
+ | Escalation | 언제 사람이 개입해야 하는가? | PR, issue, Slack alert, triage inbox |
54
+ | Exit | loop 는 어떻게 완료를 판단하는가? | Acceptance criteria, passing checks, no work found |
55
+
56
+ ## 성숙도 모델
57
+
58
+ | 레벨 | 이름 | 설명 |
59
+ | ---- | -------------------------- | -------------------------------------------------------------------------------------------- |
60
+ | 0 | Manual prompting | 사람이 상태를 읽고 다음 prompt 를 작성합니다. |
61
+ | 1 | Scripted retry | script 가 오류를 agent 에게 다시 전달합니다. |
62
+ | 2 | Scheduled loop | agent 가 일정 cadence 로 실행되고 결과를 보고합니다. |
63
+ | 3 | Stateful loop | 파일, issue, checkpoint, trace 로 진행 상황이 유지됩니다. |
64
+ | 4 | Self-verifying loop | 결정적 check 또는 evaluator agent 가 잘못된 완료를 막습니다. |
65
+ | 5 | Multi-agent loop | 전문 agents 가 discovery, implementation, review, judgment 를 나눕니다. |
66
+ | 6 | Production-supervised loop | observability, budget, approval, rollback, human escalation 이 핵심 요소가 됩니다. |
67
+
68
+ ## 시작하기
69
+
70
+ 전체 리소스 목록은 영어 canonical README 에 있습니다: [README.md](README.md).
71
+
72
+ 추천 시작 자료:
73
+
74
+ - [Loop Engineering](https://addyosmani.com/blog/loop-engineering/) - 수동 prompting 에서 prompt, 검증, 지속을 수행하는 시스템 설계로 이동하는 흐름을 정의합니다.
75
+ - [Run long horizon tasks with Codex](https://developers.openai.com/blog/run-long-horizon-tasks-with-codex) - plan-edit-test-observe-repair-document-repeat 작업을 위한 실용 runbook.
76
+ - [Run prompts on a schedule](https://code.claude.com/docs/en/scheduled-tasks) - `/loop`, scheduled tasks, recurring prompts 의 공식 메커니즘.
77
+ - [Building Effective Agents](https://www.anthropic.com/engineering/building-effective-agents) - workflows 와 agents 를 위한 composable patterns.
78
+
79
+ ## 기여하기
80
+
81
+ Pull request 를 환영합니다. 먼저 [CONTRIBUTING.md](CONTRIBUTING.md) 를 읽어 주세요.
82
+
83
+ 빠른 절차:
84
+
85
+ 1. 리소스가 AI/coding-agent 맥락의 Loop Engineering 또는 직접적인 기반인지 확인합니다.
86
+ 1. README 에서 중복 여부를 검색합니다.
87
+ 1. 가장 구체적인 카테고리를 선택합니다.
88
+ 1. 다음 형식으로 한 줄을 추가합니다.
89
+
90
+ ```md
91
+ - 📄 **Paper** [Title](https://example.com) - One sentence explaining the resource's contribution to Loop Engineering.
92
+ ```
93
+
94
+ 1. PR 에서 관련성, 카테고리, 리소스 타입, builders 에게 주는 가치를 설명합니다.
95
+
96
+ ## 번역
97
+
98
+ 새 언어를 추가하거나 유지하고 싶다면 [TRANSLATIONS.md](TRANSLATIONS.md) 를 읽어 주세요. 번역은 scope boundary 를 지켜야 하며 event loop, growth loop, 일반 automation 을 범위에 섞지 않아야 합니다.
README.md ADDED
@@ -0,0 +1,623 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Awesome Loop Engineering [![Awesome](https://awesome.re/badge.svg)](https://github.com/sindresorhus/awesome)
2
+
3
+ <p align="center">
4
+ <img src="assets/awesome-loop-engineering-cover.png" alt="Awesome Loop Engineering cover" width="100%">
5
+ </p>
6
+
7
+ <p align="center">
8
+ <a href="README.md">English</a> |
9
+ <a href="README.zh-CN.md">中文</a> |
10
+ <a href="README.es.md">Español</a> |
11
+ <a href="README.fr.md">Français</a> |
12
+ <a href="README.de.md">Deutsch</a> |
13
+ <a href="README.ja.md">日本語</a> |
14
+ <a href="README.ko.md">한국어</a> |
15
+ <a href="README.pt-BR.md">Português</a> |
16
+ <a href="TRANSLATIONS.md">Help translate</a> |
17
+ <a href="https://chaoyue0307.github.io/awesome-loop-engineering/">Landing page</a>
18
+ </p>
19
+
20
+ > A curated, implementation-oriented list of resources for **Loop Engineering**: the layer above prompt, context, and harness engineering for designing recurring AI-agent systems.
21
+
22
+ Prompt engineering improves what you ask the model. Context engineering improves what the model can see. Harness engineering improves the tools, permissions, sandboxes, and checks around one agent run. **Loop Engineering sits above all three**: it is the emerging AI and coding-agent practice of moving from manually prompting agents turn by turn to designing loops that do the prompting, supervision, verification, state updates, and re-triggering for you.
23
+
24
+ A loop discovers work, hands it to one or more agents, checks the result, records state, decides what should happen next, and runs again on a cadence or until a verifiable goal is reached.
25
+
26
+ This repository is about the new AI-agent meaning of Loop Engineering. It is **not** about software event loops, control theory, growth loops, generic workflow automation, or non-AI feedback systems.
27
+
28
+ **Quick orientation for first-time visitors:**
29
+
30
+ - **What it is:** Loop Engineering is the practice of designing recurring AI-agent and coding-agent systems—how work is discovered, delegated, verified, retried, and escalated over time, not just for a single run.
31
+ - **Why it matters now:** As coding agents move from one-off prompts to background automation, the design challenge shifts from "what do I ask?" to "how does the system keep working reliably?" This list exists because no existing collection focused on that layer.
32
+ - **Who this is for:** builders of AI agents, coding agents, and orchestration systems; reliability and eval engineers; teams adding recurring agent loops to production infrastructure.
33
+ - **Where to start:** Canonical Definition, Loop Contract, Start Here, then Pattern Library.
34
+
35
+ ## Contents
36
+
37
+ - [Why This Repo Exists](#why-this-repo-exists)
38
+ - [Mental Model](#mental-model)
39
+ - [How To Use This List](#how-to-use-this-list)
40
+ - [Reading Paths](#reading-paths)
41
+ - [Choose Your Loop](#choose-your-loop)
42
+ - [Canonical Definition](#canonical-definition)
43
+ - [Concept Guides](#concept-guides)
44
+ - [Maintainer Picks](#maintainer-picks)
45
+ - [Repository Highlights](#repository-highlights)
46
+ - [Resource Type Legend](#resource-type-legend)
47
+ - [Start Here](#start-here)
48
+ - [Scope Boundary](#scope-boundary)
49
+ - [The Loop Contract](#the-loop-contract)
50
+ - [Loop Design Checklist](#loop-design-checklist)
51
+ - [Loop Maturity Model](#loop-maturity-model)
52
+ - [Core Loop Primitives](#core-loop-primitives)
53
+ - [Official Runtime Guides](#official-runtime-guides)
54
+ - [Research Foundations](#research-foundations)
55
+ - [Agent Workflow Patterns](#agent-workflow-patterns)
56
+ - [Coding-Agent Loop Systems](#coding-agent-loop-systems)
57
+ - [Verification And Feedback Gates](#verification-and-feedback-gates)
58
+ - [Securing Unattended Loops](#securing-unattended-loops)
59
+ - [State, Memory, And Context Persistence](#state-memory-and-context-persistence)
60
+ - [Orchestration And Multi-Agent Delegation](#orchestration-and-multi-agent-delegation)
61
+ - [Benchmarks And Evaluation](#benchmarks-and-evaluation)
62
+ - [Operations Playbooks](#operations-playbooks)
63
+ - [Templates And Patterns](#templates-and-patterns)
64
+ - [Examples And Schema](#examples-and-schema)
65
+ - [Community Gallery](#community-gallery)
66
+ - [Discovery And Distribution](#discovery-and-distribution)
67
+ - [Roadmap And Discussion](#roadmap-and-discussion)
68
+ - [Pattern Library](#pattern-library)
69
+ - [Critiques, Risks, And Limitations](#critiques-risks-and-limitations)
70
+ - [Adjacent Awesome Lists](#adjacent-awesome-lists)
71
+ - [Citation](#citation)
72
+
73
+ ## Why This Repo Exists
74
+
75
+ Loop Engineering is becoming a distinct craft because the leverage point is moving from better single prompts, richer context, and stronger harnesses to recurring systems that decide when and how agents should run. The best agent workflows now combine goals, state, work isolation, tool permissions, feedback gates, retries, escalation, and receipts. This list exists to make that craft easier to learn, compare, and practice without mixing it with unrelated loop concepts or generic AI-agent hype.
76
+
77
+ ## Mental Model
78
+
79
+ Prompt engineering asks: **what should I say to the model?**
80
+
81
+ Context engineering asks: **what state and knowledge should the model see?**
82
+
83
+ Harness engineering asks: **what tools, permissions, tests, sandboxes, and feedback should surround the agent?**
84
+
85
+ Loop engineering asks: **what recurring system should discover work, delegate to agents, verify results, persist state, decide next actions, and re-run when the human is no longer in the inner loop?**
86
+
87
+ Prompt, context, and harness engineering make one agent run better. Loop Engineering makes agent work repeatable, observable, and governable over time.
88
+
89
+ <p align="center">
90
+ <img src="assets/loop-engineering-stack.svg" alt="Loop Engineering stack" width="100%">
91
+ </p>
92
+
93
+ Loop shape:
94
+
95
+ ```text
96
+ Objective
97
+ -> Trigger / cadence
98
+ -> Discover / intake work
99
+ -> Delegate to agents
100
+ -> Act in an isolated workspace
101
+ -> Verify with tests, evals, traces, or reviewers
102
+ -> if failed: feed back the evidence and retry
103
+ -> if passed: persist state and decide what happens next
104
+ -> Repeat, report, open a PR, or escalate to a human
105
+ ```
106
+
107
+ <p align="center">
108
+ <img src="assets/loop-lifecycle.svg" alt="Loop Engineering lifecycle: Intake, Delegate, Act, Verify, Persist, Decide; Decide retries by feeding evidence back, escalates to a human, or exits when the goal is met" width="100%">
109
+ </p>
110
+
111
+ ## How To Use This List
112
+
113
+ Start with the first-read resources and the Loop Contract if the term is new. For implementation work, move through core primitives, runtime guides, templates, and patterns. For reliability work, focus on verification gates, state persistence, critiques, and limitations. Contributions should prefer primary sources, official docs, papers, and implementation-heavy write-ups.
114
+
115
+ ## Reading Paths
116
+
117
+ Choose a path based on your intent.
118
+
119
+ - Learn the concept: canonical definition, mental model, comparison guide, and the Loop Contract.
120
+ - Implement a loop: core primitives, official runtime guides, the pattern library, and examples.
121
+ - Improve reliability or evals: verification gates, benchmarks, critiques, and limitations.
122
+ - Contribute: the community gallery, templates, and contribution guide.
123
+
124
+ ## Choose Your Loop
125
+
126
+ Start from the problem you have, not the pattern you want. Find the pattern name below, then open its full write-up in the Pattern Library section, or compare every pattern in the [pattern matrix](patterns/MATRIX.md), which also links each one by symptom.
127
+
128
+ | When you say... | Reach for the loop |
129
+ | -------------------------------- | -------------------------- |
130
+ | "My PR is stuck" | PR babysitter |
131
+ | "CI keeps failing" | CI repair loop |
132
+ | "The docs may be stale" | Docs drift collector |
133
+ | "A deploy needs monitoring" | Deploy verifier |
134
+ | "Feedback is noisy" | Feedback clusterer |
135
+ | "Dependency updates pile up" | Dependency triage loop |
136
+ | "Agent evals regressed" | Evaluation regression loop |
137
+ | "Sensitive changes need review" | Security review loop |
138
+ | "Agent spend is rising" | Cost-control loop |
139
+ | "I need recurring bug discovery" | Bug hunting loop |
140
+ | "A change needs sign-off" | Enterprise approval loop |
141
+ | "An incident just paged" | Incident response loop |
142
+ | "A dataset keeps drifting" | Data-quality loop |
143
+ | "Release notes are a chore" | Release-note loop |
144
+ | "Model choice is ad hoc" | Model-routing loop |
145
+
146
+ Not sure which runtime should run it? See the [runtime selection guide](meta/RUNTIME_SELECTION.md).
147
+
148
+ ## Canonical Definition
149
+
150
+ **Loop Engineering** is the AI and coding-agent practice of designing recurring systems that discover work, delegate it to agents, verify results, persist state, decide next actions, and run again on a cadence, event, or until a verifiable goal is reached.
151
+
152
+ ## Concept Guides
153
+
154
+ These repository-native guides define the concept, boundaries, and practical artifacts without relying on vendor-specific terminology.
155
+
156
+ - 🧾 **Template** [Canonical Definition](DEFINITION.md) - Short definition, positioning, minimal loop test, and citation note.
157
+ - 🧾 **Template** [Loop Engineering Manifesto](MANIFESTO.md) - Concise statement of the concept, commitments, non-goals, and success standard.
158
+ - 🧾 **Template** [Loop Engineering Taxonomy](TAXONOMY.md) - Classification by trigger, intake, verification, state model, topology, and operating domain.
159
+ - ⚠️ **Critique** [Loop Engineering Anti-Patterns](ANTI-PATTERNS.md) - Common failure modes such as prompt loops with no contract, infinite retries, model self-approval, hidden state, and unsafe autonomy.
160
+ - 🧾 **Template** [Comparison Guide](COMPARISON.md) - Distinguishes Loop Engineering from prompt engineering, context engineering, harness engineering, workflow automation, agent workflows, and evaluation loops.
161
+ - 🧾 **Template** [Sourced Signals And Quotes](QUOTES.md) - Short sourced signals from linked public materials that anchor the emerging concept.
162
+ - 🧾 **Template** [Outreach Kit](meta/OUTREACH.md) - Conservative messages for inviting corrections, sources, and real-world loop patterns.
163
+
164
+ ## Maintainer Picks
165
+
166
+ - 🧾 **Template** [Maintainer Picks](MAINTAINER_PICKS.md) - Shortlist of concept, practice, reliability, and reusable artifact resources.
167
+
168
+ ## Repository Highlights
169
+
170
+ Beyond the curated list, this repository ships its own artifacts: an operational pattern library, a schema-validated loop contract for every pattern, a runnable reference loop, a community gallery, eight language entry points, a standalone landing page, and an active discussion thread for real or anonymized Loop Engineering patterns.
171
+
172
+ ## Resource Type Legend
173
+
174
+ - 📄 **Paper**: academic paper, preprint, or technical report.
175
+ - 📝 **Blog**: essay, field note, article, or practitioner write-up.
176
+ - 📚 **Docs**: official product, API, SDK, or platform documentation.
177
+ - 🧰 **Tool**: repository, framework, SDK, runtime, or implementation.
178
+ - 🧪 **Benchmark**: benchmark, eval suite, leaderboard, or evaluation dataset.
179
+ - 🔁 **Pattern**: real-world loop pattern, operational playbook, or reusable workflow.
180
+ - 🧾 **Template**: template, checklist, schema, repository guide, or contribution artifact.
181
+ - 🧭 **List**: adjacent awesome list, ecosystem map, or curated collection.
182
+ - ⚠️ **Critique**: risk analysis, limitation, caveat, or skeptical take.
183
+
184
+ ## Start Here
185
+
186
+ Direct resources about the new AI/coding-agent meaning of Loop Engineering.
187
+
188
+ - 📝 **Blog** [Loop Engineering](https://addyosmani.com/blog/loop-engineering/) - Addy Osmani's framing of loop engineering as the layer above manually prompting coding agents, with concrete primitives across Codex and Claude Code.
189
+ - 📝 **Blog** [Loop Engineering](https://addyo.substack.com/p/loop-engineering) - Substack version of the same essay; useful for the original discussion trail and quotations from Peter Steinberger and Boris Cherny.
190
+ - 📝 **Blog** [Loop Engineering](https://cobusgreyling.substack.com/p/loop-engineering) - Concise explanation of the shift from prompting agents to designing loops that discover work, delegate, verify, persist, and continue.
191
+ - 📝 **Blog** [Loop Engineering: The Guide for AI Agents](https://lushbinary.com/blog/loop-engineering-ai-coding-agents-guide/) - Practical guide that breaks the pattern into automations, worktrees, skills, connectors, subagents, and state.
192
+ - 🔁 **Pattern** [Codex Loops: What Boris Cherny Gets Right About Managing Agent Work](https://www.developersdigest.tech/blog/codex-loops-boris-cherny-agent-routines) - Engineering note on recurring agent loops for PR babysitting, CI repair, deploy verification, and feedback clustering.
193
+ - 📝 **Blog** [I Now Just Write Loops To Prompt Claude Code: Claude Code Creator Boris Cherny](https://officechai.com/ai/i-now-just-write-loops-to-prompt-claude-code-claude-code-creator-boris-cherny/) - Coverage of Boris Cherny's "my job is to write loops" workflow.
194
+ - 📝 **Blog** [My Lord! AI Programming Undergoes Another Major Shift](https://eu.36kr.com/en/p/3844224911346184) - Broad coverage of the Boris Cherny and Peter Steinberger discussion, including the distinction between cold-start scripts and persistent agent loops.
195
+ - 📝 **Blog** [Peter Steinberger on designing loops](https://x.com/steipete/status/2063697162748260627) - The June 2026 post - "you shouldn't be prompting coding agents anymore, you should be designing loops that prompt your agents" - that catalyzed the current discussion.
196
+ - 📝 **Blog** [The Anthropic leader who built Claude Code ditched prompting - now he writes loops](https://thenewstack.io/loop-engineering/) - The New Stack's report on Boris Cherny's shift from prompting to loop writing and what it changes about developer workflow.
197
+ - 📝 **Blog** [Stop Prompting. Design the Loop.](https://www.pulumi.com/blog/stop-prompting-design-the-loop/) - Practical breakdown of loop building blocks - automations, worktrees, skills, connectors, subagents - plus external memory and verification through oracles such as tests and builds.
198
+ - 📝 **Blog** [Boris Cherny: five tips for running Opus autonomously for hours or days](https://x.com/bcherny/status/2063792263067754658) - The Claude Code creator's compact loop recipe: auto-mode permissions, dynamic workflows, `/goal` or `/loop`, the cloud runner, and end-to-end self-verification.
199
+
200
+ ## Scope Boundary
201
+
202
+ | In scope | Out of scope |
203
+ | ------------------------------------------------------------------------------------------------------------------- | --------------------------------------------------------------- |
204
+ | AI/coding-agent loops that coordinate prompts, context, harnesses, verification, and state over repeated agent runs | Software event loops, UI/game loops, or control theory loops |
205
+ | Scheduled, goal-driven, or event-triggered agent work | Generic cron jobs with no agentic reasoning or verification |
206
+ | Agent loops with durable state, worktrees, checkpoints, traces, or progress files | One-off prompt examples with no loop, state, or feedback signal |
207
+ | Verification loops using tests, CI, evals, reviewers, or deterministic gates | Pure AI news, generic product pages, or marketing copy |
208
+ | Multi-agent maker/checker/delegation patterns | Broad agent lists without specific loop-design relevance |
209
+
210
+ ## The Loop Contract
211
+
212
+ A useful loop has a contract. If one of these is missing, the loop usually becomes either a manual prompt habit or an unsafe background automation. Prompt, context, and harness choices are ingredients; the loop contract is the operating layer that connects them over time.
213
+
214
+ <p align="center">
215
+ <img src="assets/loop-contract-cards.svg" alt="Loop Contract cards" width="100%">
216
+ </p>
217
+
218
+ | Part | Design question | Common artifact |
219
+ | ----------------- | -------------------------------------- | ------------------------------------------------------------ |
220
+ | Objective | What should the loop optimize for? | Goal, issue, PRD, runbook |
221
+ | Trigger | When does the loop run? | Schedule, webhook, `/loop`, `/goal`, automation |
222
+ | Discover / Intake | How does the loop find work? | GitHub queries, Linear filters, CI failures, feedback stream |
223
+ | Workspace | Where can the agent act safely? | Worktree, sandbox, branch, container |
224
+ | Context | What durable knowledge should it load? | `AGENTS.md`, `CLAUDE.md`, `SKILL.md`, docs |
225
+ | Delegation | Which agent does which job? | Explorer, implementer, reviewer, judge |
226
+ | Verification | What says "yes" or "no"? | Tests, typecheck, lint, evals, trace graders |
227
+ | State | What survives the next run? | Progress file, database checkpoint, trace, issue comment |
228
+ | Budget | When should it stop spending? | Max turns, max retries, token budget, time box |
229
+ | Escalation | When does a human take over? | PR, issue, Slack alert, triage inbox |
230
+ | Exit | How does the loop know it is done? | Acceptance criteria, passing checks, no work found |
231
+
232
+ Good loop documentation should make the contract visible. A reader should be able to tell what triggers the loop, what state it reads, what it is allowed to change, how it verifies progress, and when it stops.
233
+
234
+ ## Loop Design Checklist
235
+
236
+ | Check | Question |
237
+ | ------------------------------- | ---------------------------------------------------------------------------------------------------- |
238
+ | Name one objective | Does the loop optimize for a specific outcome instead of a vague goal such as "improve the repo"? |
239
+ | Define the intake | Where does work enter: PR comments, CI failures, issues, logs, eval failures, feedback, or schedule? |
240
+ | Isolate execution | Does the agent act in a worktree, sandbox, branch, container, or read-only mode? |
241
+ | Write the feedback signal first | Do tests, typechecks, lint, evals, policy checks, or trace graders exist before retries begin? |
242
+ | Persist state outside the model | Does progress survive in files, issue comments, checkpoints, traces, or a database? |
243
+ | Separate maker and checker | Does something other than the acting agent decide whether the work is done? |
244
+ | Put a budget on autonomy | Are runtime, turns, retries, token spend, and concurrent workers capped? |
245
+ | Design escalation | Is it clear when the loop should open a PR, file an issue, ask a human, or stop? |
246
+ | Keep receipts | Are commands, evidence, changed files, and stop reasons recorded? |
247
+
248
+ ## Loop Maturity Model
249
+
250
+ | Level | Name | Description |
251
+ | ----- | -------------------------- | ---------------------------------------------------------------------------------- |
252
+ | 0 | Manual prompting | A human reads state and writes the next prompt. |
253
+ | 1 | Scripted retry | A shell/script loop feeds errors back to an agent. |
254
+ | 2 | Scheduled loop | The agent runs on a cadence and reports findings. |
255
+ | 3 | Stateful loop | Progress survives across sessions through files, issues, checkpoints, or traces. |
256
+ | 4 | Self-verifying loop | Deterministic checks or evaluator agents gate completion. |
257
+ | 5 | Multi-agent loop | Specialized agents split discovery, implementation, review, and judgment. |
258
+ | 6 | Production-supervised loop | Observability, budgets, approvals, rollback, and human escalation are first-class. |
259
+
260
+ Most teams should climb this model slowly. A reliable Level 3 loop with clear state and deterministic checks is usually more valuable than a flashy Level 5 loop with vague goals.
261
+
262
+ ## Core Loop Primitives
263
+
264
+ These are the building blocks that make a loop more than a repeated prompt.
265
+
266
+ - 📚 **Docs** [Automations - Codex app](https://developers.openai.com/codex/app/automations) - Codex background automations for recurring tasks, triage inboxes, skills, and worktree isolation.
267
+ - 📚 **Docs** [Follow a goal - Codex use cases](https://developers.openai.com/codex/use-cases/follow-goals) - Official guidance for durable objectives with stopping conditions, validation commands, checkpoints, and progress logs.
268
+ - 📚 **Docs** [Worktrees - Codex app](https://developers.openai.com/codex/app/worktrees) - Codex worktree model for isolated parallel tasks and handoffs between local and background workspaces.
269
+ - 📚 **Docs** [Prompting - Codex](https://developers.openai.com/codex/prompting) - Explains the Codex loop, threads, context, and `/goal` mode.
270
+ - 📚 **Docs** [Customization - Codex](https://developers.openai.com/codex/concepts/customization) - Maps `AGENTS.md`, memories, skills, MCP, and subagents into a coherent customization stack.
271
+ - 📚 **Docs** [Agent Skills - Codex](https://developers.openai.com/codex/skills) - Official skill format for reusable workflows, scripts, MCP dependencies, invocation policy, and plugin packaging.
272
+ - 📚 **Docs** [Plugins - Codex](https://developers.openai.com/codex/plugins) - Bundles skills, app integrations, and MCP servers into reusable loop capabilities.
273
+ - 📚 **Docs** [Slash commands in Codex CLI](https://developers.openai.com/codex/cli/slash-commands) - CLI commands for switching agent threads, browsing skills, inspecting MCP tools, and using subagent workflows.
274
+ - 🔁 **Pattern** [Autonomous Loops](https://claudecodeguide.dev/docs/patterns/autonomous-loops) - Claude Code pattern using task files, stop hooks, restart behavior, hard limits, and a kill switch.
275
+ - 📚 **Docs** [Claude Code Glossary](https://code.claude.com/docs/en/glossary.md) - Defines the agentic loop, hooks, subagents, skills, MCP, and related primitives in Claude Code terminology.
276
+ - 📚 **Docs** [Keep Claude working toward a goal](https://code.claude.com/docs/en/goal) - `/goal` runs turn after turn until a completion condition is met by a verifier.
277
+ - 📚 **Docs** [Run prompts on a schedule](https://code.claude.com/docs/en/scheduled-tasks) - `/loop`, scheduled tasks, reminders, monitor tools, and session-scoped recurring prompts.
278
+ - 📚 **Docs** [Automate work with routines](https://code.claude.com/docs/en/routines) - Claude Code routines: persistent cloud automations triggered by schedules, API calls, or GitHub events, with connectors, scoped environments, and branch-push limits.
279
+ - 📚 **Docs** [Desktop scheduled tasks](https://code.claude.com/docs/en/desktop-scheduled-tasks) - Local recurring runs on your own machine, with the persistence, file-access, permission, worktree, and missed-run trade-offs that distinguish them from `/loop` and cloud routines.
280
+ - 📚 **Docs** [Run parallel sessions with worktrees](https://code.claude.com/docs/en/worktrees) - Worktree isolation for parallel sessions and subagents so concurrent edits do not collide.
281
+ - 📚 **Docs** [Automate actions with hooks](https://code.claude.com/docs/en/hooks-guide) - Claude Code hooks guide for deterministic lifecycle control around model actions.
282
+ - 📚 **Docs** [Hooks reference](https://code.claude.com/docs/en/hooks.md) - Event-level reference for session, turn, tool-call, and subagent hooks.
283
+ - 📚 **Docs** [Common workflows - Claude Code](https://code.claude.com/docs/en/common-workflows) - Practical workflows for worktrees, subagents, CI, batch processing, planning, and resuming prior work.
284
+ - 📚 **Docs** [Manage multiple agents with agent view](https://code.claude.com/docs/en/agent-view.md) - Dashboard for dispatching, monitoring, and attaching to background agent sessions.
285
+ - 📚 **Docs** [Run agents in parallel](https://code.claude.com/docs/en/agents.md) - Compares agent view, subagents, agent teams, worktrees, tasks, and workflows for parallel work.
286
+ - 📚 **Docs** [Orchestrate subagents at scale with dynamic workflows](https://code.claude.com/docs/en/workflows) - Moves loop state and branching into workflow scripts so large tasks do not overload the conversation context.
287
+ - 📚 **Docs** [Create plugins](https://code.claude.com/docs/en/plugins) - Packaging model-invoked skills, agents, hooks, MCP servers, monitors, and settings as shareable loop components.
288
+ - 📚 **Docs** [Model Context Protocol](https://modelcontextprotocol.io/docs/getting-started/intro) - Standard protocol for exposing tools and data sources to agent loops.
289
+ - 📚 **Docs** [Allowing GitHub Copilot CLI to work autonomously](https://docs.github.com/en/copilot/concepts/agents/copilot-cli/autopilot) - Copilot CLI autopilot mode plus `/every` and `/after` scheduling, turning the CLI into an unattended loop that runs steps until a task is complete.
290
+
291
+ ## Official Runtime Guides
292
+
293
+ Primary-source docs from agent runtime vendors and framework builders.
294
+
295
+ - 📚 **Docs** [Run long horizon tasks with Codex](https://developers.openai.com/blog/run-long-horizon-tasks-with-codex) - OpenAI's runbook for plan-edit-test-observe-repair-document-repeat work, including specs, plans, status logs, and validation gates.
296
+ - 📚 **Docs** [Best practices - Codex](https://developers.openai.com/codex/learn/best-practices) - Official best practices for context, `AGENTS.md`, MCP, skills, subagents, and automations.
297
+ - 📚 **Docs** [Agents SDK](https://developers.openai.com/api/docs/guides/agents) - OpenAI guide for agent orchestration, tool execution, approvals, state, guardrails, and observability.
298
+ - 📚 **Docs** [Agents - OpenAI Agents SDK](https://openai.github.io/openai-agents-python/agents/) - SDK primitives for agents, tools, handoffs, guardrails, and runner-managed loops.
299
+ - 📚 **Docs** [Running agents](https://developers.openai.com/api/docs/guides/agents/running-agents) - OpenAI guide to turns, state, approvals, sessions, and continuation in the SDK runtime loop.
300
+ - 📚 **Docs** [Integrations and observability](https://developers.openai.com/api/docs/guides/agents/integrations-observability) - OpenAI guide to MCP wiring and traces as the basis for debugging and evaluation loops.
301
+ - 📚 **Docs** [Sandbox Agents](https://developers.openai.com/api/docs/guides/agents/sandboxes) - Splits the harness control plane from the sandbox execution plane for long-running file and command work.
302
+ - 📚 **Docs** [Guardrails and human review](https://developers.openai.com/api/docs/guides/agents/guardrails-approvals) - Approval and validation boundaries for sensitive agent actions.
303
+ - 📚 **Docs** [Building agents with the Claude Agent SDK](https://code.claude.com/docs/en/agent-sdk/overview.md) - Claude SDK overview for tool-using agents, subagents, state, permissions, and streaming.
304
+ - 📚 **Docs** [How the agent loop works](https://code.claude.com/docs/en/agent-sdk/agent-loop) - Official walkthrough of the inner agent loop that outer recurring loops build on.
305
+ - 📚 **Docs** [Extend Claude with skills](https://code.claude.com/docs/en/skills) - Claude Code skill system for reusable loop instructions and assets.
306
+ - 📚 **Docs** [Create custom subagents](https://code.claude.com/docs/en/sub-agents) - Claude Code custom subagents with isolated context, model choice, and tool permissions.
307
+ - 📚 **Docs** [GitHub Agentic Workflows](https://github.github.com/gh-aw/) - Repository automation that runs coding agents in GitHub Actions on events or schedules with guardrails.
308
+ - 📝 **Blog** [GitHub Agentic Workflows technical preview](https://github.blog/changelog/2026-02-13-github-agentic-workflows-are-now-in-technical-preview/) - Changelog announcement for Markdown-defined agentic workflows in GitHub Actions.
309
+ - 📚 **Docs** [Continuous AI](https://githubnext.com/projects/continuous-ai/) - GitHub Next's umbrella framing for CI/CD-style AI automation across the software lifecycle, the category that agentic workflows demonstrate.
310
+ - 📝 **Blog** [Automate repository tasks with GitHub Agentic Workflows](https://github.blog/ai-and-ml/automate-repository-tasks-with-github-agentic-workflows/) - Official walkthrough of writing Markdown-defined agentic workflows with guardrails for triage, QA, and docs chores.
311
+ - 📝 **Blog** [Continuous AI in practice: What developers can automate today with agentic CI](https://github.blog/ai-and-ml/generative-ai/continuous-ai-in-practice-what-developers-can-automate-today-with-agentic-ci/) - Concrete agentic-CI automations available today, with recurring patterns for triage, review, and documentation upkeep.
312
+ - 📚 **Docs** [About GitHub Copilot coding agent](https://docs.github.com/en/copilot/concepts/agents/coding-agent/about-coding-agent) - GitHub's autonomous coding agent: assign an issue, the agent works in an isolated Actions-powered workspace, and a reviewable pull request comes back.
313
+ - 📝 **Blog** [GitHub Copilot: Meet the new coding agent](https://github.blog/news-insights/product-news/github-copilot-meet-the-new-coding-agent/) - Launch overview of the issue-to-PR delegation loop, including iteration on review feedback.
314
+ - 📚 **Docs** [Jules](https://jules.google/docs) - Google's asynchronous coding agent that plans, executes tasks in isolated cloud VMs, and returns reviewable diffs.
315
+ - 📚 **Docs** [Cursor cloud agents](https://cursor.com/docs/cloud-agent) - Remote agents that work asynchronously in isolated environments and hand results back for review.
316
+ - 📚 **Docs** [Devin Docs](https://docs.devin.ai/get-started/devin-intro) - Documentation for a long-running autonomous software engineer with sessions, playbooks, knowledge, and review boundaries.
317
+ - 📚 **Docs** [Writing effective tools for AI agents](https://www.anthropic.com/engineering/writing-tools-for-agents) - Anthropic's guidance on evaluating and improving tool specs using agentic loops and realistic tasks.
318
+ - 📚 **Docs** [Introducing advanced tool use on the Claude Developer Platform](https://www.anthropic.com/engineering/advanced-tool-use?e45d281a_page=3) - Tool search, programmatic tool calling, and tool-use examples for scaling large tool libraries without flooding context.
319
+ - 📚 **Docs** [Effective harnesses for long-running agents](https://www.anthropic.com/engineering/effective-harnesses-for-long-running-agents) - Anthropic's guidance for agents that work across many context windows: durable progress artifacts, environment setup, and self-verification.
320
+ - 📚 **Docs** [Claude Code best practices](https://code.claude.com/docs/en/best-practices) - Widely cited workflow guidance that underlies many recurring Claude Code loops.
321
+
322
+ ## Research Foundations
323
+
324
+ Loop Engineering is new as a practice name, but it builds on years of agent-loop, feedback, planning, and self-correction research.
325
+
326
+ - 📄 **Paper** [ReAct: Synergizing Reasoning and Acting in Language Models](https://arxiv.org/abs/2210.03629) - Foundational reason-act-observe loop for tool-using language agents.
327
+ - 📄 **Paper** [Reflexion: Language Agents with Verbal Reinforcement Learning](https://arxiv.org/abs/2303.11366) - Converts environment feedback into written reflections stored in memory for future attempts.
328
+ - 📄 **Paper** [Self-Refine: Iterative Refinement with Self-Feedback](https://arxiv.org/abs/2303.17651) - Generate-feedback-refine loop where a model improves outputs over repeated passes.
329
+ - 📄 **Paper** [CRITIC: Large Language Models Can Self-Correct with Tool-Interactive Critiquing](https://arxiv.org/abs/2305.11738) - Uses tools to ground critique and correction rather than relying only on introspection.
330
+ - 📄 **Paper** [Tree of Thoughts](https://arxiv.org/abs/2305.10601) - Search over multiple reasoning branches; relevant when loop design needs exploration before committing.
331
+ - 📄 **Paper** [Graph of Thoughts](https://arxiv.org/abs/2308.09687) - Generalizes thought structures beyond chains and trees, useful for complex loop planning and aggregation.
332
+ - 📄 **Paper** [Language Agent Tree Search Unifies Reasoning Acting and Planning in Language Models](https://arxiv.org/abs/2310.04406) - Combines search, action, and environment feedback for language agents.
333
+ - 📄 **Paper** [Voyager: An Open-Ended Embodied Agent with Large Language Models](https://arxiv.org/abs/2305.16291) - Demonstrates lifelong skill acquisition through iterative exploration, feedback, and a skill library.
334
+ - 📄 **Paper** [Generative Agents: Interactive Simulacra of Human Behavior](https://arxiv.org/abs/2304.03442) - Introduces reflection and memory mechanisms for long-running agent behavior.
335
+ - 📄 **Paper** [Measuring AI Ability to Complete Long Software Tasks](https://arxiv.org/abs/2503.14499) - METR's task-length time horizon metric; grounds why loop budgets, checkpoints, and escalation matter as autonomous work gets longer.
336
+ - 📝 **Blog** [Measuring AI Ability to Complete Long Tasks](https://metr.org/blog/2025-03-19-measuring-ai-ability-to-complete-long-tasks/) - Accessible summary of the 50% task-completion time horizon and its doubling trend.
337
+ - 📄 **Paper** [Reflection-Driven Control for Trustworthy Code Agents](https://arxiv.org/abs/2512.21354) - Elevates reflection from an external pass to an internal control loop that monitors the agent's decision path during generation and constrains risky steps with low overhead.
338
+ - 📄 **Paper** [PARC: An Autonomous Self-Reflective Coding Agent for Robust Execution of Long-Horizon Tasks](https://arxiv.org/abs/2512.03549) - Hierarchical plan-execute-assess loops that detect and correct strategic errors during multi-hour autonomous runs.
339
+ - 📄 **Paper** [When the Specification Emerges: Benchmarking Faithfulness Loss in Long-Horizon Coding Agents](https://arxiv.org/abs/2603.17104) - Measures how agents drift from intent when specifications arrive incrementally across a long loop, and proposes a mitigation that recovers most of the loss.
340
+ - 🧰 **Tool** [Reflexion code](https://github.com/noahshinn/reflexion) - Reference implementation and experiments for verbal reinforcement loops.
341
+
342
+ ## Agent Workflow Patterns
343
+
344
+ These resources are included when they help design the higher-level loop around agents, not merely because they describe agents in general.
345
+
346
+ - 📚 **Docs** [Building Effective Agents](https://www.anthropic.com/engineering/building-effective-agents) - Anthropic's canonical guide to workflows and agents, including evaluator-optimizer and orchestrator-workers patterns.
347
+ - 📝 **Blog** [How we built our multi-agent research system](https://www.anthropic.com/engineering/multi-agent-research-system) - Detailed orchestrator-worker system with planning, memory, subagents, citation passes, and iterative research loops.
348
+ - 📄 **Paper** [Building Effective AI Agents: Architecture Patterns and Implementation Frameworks](https://resources.anthropic.com/hubfs/Building%20Effective%20AI%20Agents-%20Architecture%20Patterns%20and%20Implementation%20Frameworks.pdf) - PDF overview of agent architecture patterns, including generator-evaluator loops.
349
+ - 📝 **Blog** [AI Agent Architectures](https://hld.handbook.academy/curriculum/ai-ml-system-design/ai-agent-architectures/) - System-design overview of ReAct, reflection, planning, tool use, memory, and control strategies.
350
+ - 📝 **Blog** [What Are Agentic Workflows?](https://weaviate.io/blog/what-are-agentic-workflows) - Accessible taxonomy of planning, tool use, reflection, and memory patterns.
351
+ - 📝 **Blog** [Agent Planning & Reflection Patterns](https://learnaivisually.com/tracks/ai-agents/planning-reflection) - Visual explanation of plan-execute, observe, reflect, retry, and stop patterns.
352
+ - 📝 **Blog** [Agentic Design Patterns](https://addyosmani.com/agents/04-agentic-design-patterns/) - Practical overview of ReAct, reflection, tool use, planning, and how to combine them in real-world agents.
353
+ - 🔁 **Pattern** [12 Factor Agents](https://github.com/humanlayer/12-factor-agents) - Operating principles for production agents, including explicit prompts, state ownership, and pause-resume behavior.
354
+ - 🔁 **Pattern** [Durable Execution for Agentic Workflows](https://arizenai.com/durable-execution/) - Explains checkpointing, event-sourced journals, replay, and recovery for long-running agent workflows.
355
+
356
+ ## Coding-Agent Loop Systems
357
+
358
+ - 🧰 **Tool** [SWE-agent](https://github.com/SWE-agent/SWE-agent) - Agent-computer interface and autonomous software engineering agent for repository tasks.
359
+ - 📄 **Paper** [SWE-agent: Agent-Computer Interfaces Enable Automated Software Engineering](https://arxiv.org/abs/2405.15793) - Paper behind SWE-agent and its interface design.
360
+ - 🧰 **Tool** [mini-SWE-agent](https://mini-swe-agent.com/latest/) - Minimal coding agent that is useful for understanding the core loop without a large framework.
361
+ - 🧰 **Tool** [OpenHands](https://github.com/All-Hands-AI/OpenHands) - Open platform for AI software developers as generalist agents.
362
+ - 📄 **Paper** [OpenHands: An Open Platform for AI Software Developers as Generalist Agents](https://arxiv.org/abs/2407.16741) - Paper describing OpenHands, CodeActAgent, benchmarks, and generalist agent evaluation.
363
+ - 🧰 **Tool** [Agentless](https://github.com/OpenAutoCoder/Agentless) - Workflow-based approach for software issue resolution using localization, repair, and patch validation.
364
+ - 📄 **Paper** [Agentless: Demystifying LLM-based Software Engineering Agents](https://arxiv.org/abs/2407.01489) - Useful contrast case: strong results through structured workflow rather than a fully open-ended agent.
365
+ - 🧰 **Tool** [AutoCodeRover](https://github.com/AutoCodeRoverSG/auto-code-rover) - Autonomous program improvement system for issue localization, patch generation, and validation.
366
+ - 📄 **Paper** [AutoCodeRover: Autonomous Program Improvement](https://arxiv.org/abs/2404.05427) - Paper on autonomous code repair loops over real repositories.
367
+ - 🔁 **Pattern** [Ralph](https://ghuntley.com/ralph/) - Geoffrey Huntley's original Ralph technique: run one agent in a bare loop with fresh context per iteration and the filesystem plus specs as memory.
368
+ - 🔁 **Pattern** [everything is a ralph loop](https://ghuntley.com/loop/) - Follow-up essay arguing the loop, not the agent, is the durable engineering unit: one task per iteration, deterministic context, and verification inside the loop.
369
+ - 🧰 **Tool** [how-to-ralph-wiggum](https://github.com/ghuntley/how-to-ralph-wiggum) - Reference repository documenting the Ralph Wiggum technique end to end, from the bare loop script to guardrails and conventions.
370
+ - 📝 **Blog** [A Brief History of Ralph](https://www.humanlayer.dev/blog/brief-history-of-ralph) - Traces how the bare-loop technique spread from a provocation to a production practice among early adopters.
371
+ - 🔁 **Pattern** [Ralph Copilot](https://github.com/giocaizzi/ralph-copilot/tree/e5b2813cc876c73a8c9d3398c0115da0d15f63cf) - Language-agnostic Ralph loop implementation using fresh context, filesystem memory, `PRD.md`, and `PROGRESS.md`.
372
+ - 🔁 **Pattern** [Compound Engineering](https://every.to/guides/compound-engineering) - Every's named plan-work-review-compound loop, where each run feeds lessons back into `AGENTS.md`-style memory so the next loop is easier; the self-improving counterpart to Ralph.
373
+ - 🧰 **Tool** [Gas Town](https://github.com/steveyegge/gastown) - Steve Yegge's multi-agent orchestrator that runs 20-30 parallel coding agents with coordinator, worker, and merge-queue roles; the structured-orchestration end of the spectrum that Ralph anchors with bare iteration.
374
+ - 🧰 **Tool** [Amp](https://ampcode.com/) - Agentic coding tool built around threads, subagents, and an opinionated harness, with an owner's manual that documents loop-style operating practices.
375
+ - 🧰 **Tool** [karl](https://github.com/kayoslab/karl) - Autonomous multi-agent development loop with planner, reviewer, architect, tester, developer, deployment, and retry phases.
376
+ - 🔁 **Pattern** [joelclaw agent-loop skill](https://github.com/joelhooks/joelclaw/blob/main/skills/agent-loop/SKILL.md) - Durable Planner-Implementor-Reviewer-Judge coding loops via Inngest events and progress files.
377
+ - 🧭 **List** [SWE-bench reading list](https://github.com/SWE-bench/reading-list) - Maintained map of software engineering agent systems and related papers.
378
+
379
+ ## Verification And Feedback Gates
380
+
381
+ These resources include harness and observability mechanisms that loops compose into exit gates, receipts, and retry signals.
382
+
383
+ - 📝 **Blog** [Why Agentic Systems Must Produce Deterministic Outputs to Scale](https://streamzero.com/blog/posts/deep-dives-tools-technologies-architectures/agentic-patterns/why-agentic-systems-must-produce-deterministic-outputs-to-scale) - Argues for deterministic boundaries, contracts, and execution gates around probabilistic agent reasoning.
384
+ - 🔁 **Pattern** [Stop Babysitting Your Coding Agent. Give It Backpressure.](https://generativeprogrammer.com/p/stop-babysitting-your-coding-agent) - Explains how to turn tests, linters, builds, traces, and other signals into feedback loops for coding agents.
385
+ - 🔁 **Pattern** [How to Build a Self-Verification Loop in Claude Code](https://dev.to/shipwithaiio/how-to-build-a-self-verification-loop-in-claude-code-3-layers-20-minutes-m1p) - Uses hooks to enforce syntax, intent, and regression checks before an agent can finish.
386
+ - 📝 **Blog** [How to build a better agent harness with traces and evals](https://arize.com/blog/improve-ai-agents-traces-evals-harness/) - Trace-evaluate-debug-refine loop for improving agent behavior from real runs.
387
+ - 📝 **Blog** [Better Harness: A Recipe for Harness Hill-Climbing with Evals](https://www.langchain.com/blog/better-harness-a-recipe-for-harness-hill-climbing-with-evals) - LangChain's recipe for using evals as the learning signal for harness improvement.
388
+ - 📝 **Blog** [Improving Deep Agents with harness engineering](https://www.langchain.com/blog/improving-deep-agents-with-harness-engineering) - Practical discussion of self-verification, traces, middleware, and loop detection for coding agents.
389
+ - 📚 **Docs** [OpenAI agent evals](https://developers.openai.com/api/docs/guides/agent-evals) - Evaluation guidance for moving from traces to repeatable grading of agent workflows.
390
+ - 🧰 **Tool** [Promptfoo OpenAI Agents provider](https://www.promptfoo.dev/docs/providers/openai-agents/) - Testing and assertions for multi-turn agent workflows, tools, state, handoffs, sandboxes, and traces.
391
+ - 🧰 **Tool** [Inspect AI](https://github.com/UKGovernmentBEIS/inspect_ai) - UK AISI evaluation framework with solvers, scorers, sandboxing, tool use, MCP, and log viewing.
392
+ - 📚 **Docs** [OpenTelemetry Semantic Conventions for Generative AI Systems](https://opentelemetry.io/docs/specs/semconv/gen-ai/) - Portable tracing conventions for model calls, tool calls, and agent workflows.
393
+ - 🧰 **Tool** [AgentOps](https://github.com/AgentOps-AI/agentops) - Monitoring, replay, cost tracking, benchmarking, and tracing for agent sessions.
394
+ - 🧰 **Tool** [Langfuse](https://github.com/langfuse/langfuse) - Open-source LLM engineering platform with tracing, evaluations, and metrics that loops can read back as feedback signals.
395
+ - 🧰 **Tool** [LangSmith](https://www.langchain.com/langsmith) - Tracing, evaluation, and monitoring platform for inspecting and grading agent runs across iterations.
396
+ - 🧰 **Tool** [Arize Phoenix](https://github.com/Arize-ai/phoenix) - Open-source AI observability for tracing, evaluating, and debugging agent behavior from real runs.
397
+ - 🧰 **Tool** [Braintrust](https://www.braintrust.dev/) - Evaluation and observability platform with experiments, datasets, and CI integration for gating agent changes.
398
+ - 🧰 **Tool** [Weave](https://docs.wandb.ai/weave) - Weights & Biases toolkit for tracing, evaluating, and monitoring agent applications over time.
399
+ - 📄 **Paper** [Agentic Verification of Software Systems](https://arxiv.org/abs/2511.17330) - Pairs a coding agent with a theorem prover (AutoRocq) in a generate-and-validate loop, turning formal proof into the exit gate for trusted automatic programming.
400
+
401
+ ## Securing Unattended Loops
402
+
403
+ A loop that runs while nobody watches needs stronger boundaries than an interactive session. These resources cover the main risks: untrusted intake content, over-broad permissions, and unsandboxed execution.
404
+
405
+ - ⚠️ **Critique** [The lethal trifecta for AI agents](https://simonwillison.net/2025/Jun/16/the-lethal-trifecta/) - Simon Willison's rule of thumb: private data, untrusted content, and an exfiltration channel must never meet inside one unattended agent.
406
+ - ⚠️ **Critique** [Prompt injection series](https://simonwillison.net/series/prompt-injection/) - Ongoing series on the core unsolved vulnerability for loops whose intake includes content written by strangers.
407
+ - 📚 **Docs** [Agentic AI - Threats and Mitigations](https://genai.owasp.org/resource/agentic-ai-threats-and-mitigations/) - OWASP threat model for agentic systems, useful when reviewing intake, memory, tool, and delegation boundaries.
408
+ - 🧰 **Tool** [sandbox-runtime](https://github.com/anthropic-experimental/sandbox-runtime) - Anthropic's OS-level filesystem and network sandboxing for arbitrary processes without requiring a container.
409
+ - 🧰 **Tool** [E2B](https://github.com/e2b-dev/E2B) - Open-source isolated cloud sandboxes for running untrusted, AI-generated code inside agent loops.
410
+ - 📚 **Docs** [Modal Sandboxes](https://modal.com/docs/guide/sandboxes) - Secure sandboxed execution for agent-driven code with resource limits and network controls.
411
+ - 🧰 **Tool** [Daytona](https://www.daytona.io/) - Infrastructure for running AI-generated code in fast, isolated sandboxes.
412
+
413
+ ## State, Memory, And Context Persistence
414
+
415
+ This section focuses on durable loop state and cross-run context. For context-window design as its own lower layer, see the adjacent Context Engineering lists.
416
+
417
+ - 📚 **Docs** [Effective Context Engineering for AI Agents](https://www.anthropic.com/engineering/effective-context-engineering-for-ai-agents) - Anthropic guide to context as managed runtime state rather than a prompt dump.
418
+ - 📝 **Blog** [Agent Harnesses: the Infrastructure Layer Your LLM Agent Actually Needs](https://ninadpathak.com/blog/agent-harnesses/) - Covers execution loops, state, checkpointing, observers, and replayability.
419
+ - 📝 **Blog** [The Agent Loop Is the New OS](https://www.harness.io/blog/agent-loop-new-os) - Frames the agent loop as an OS-like boundary with context as RAM and tools as I/O.
420
+ - 📝 **Blog** [Harness engineering for coding agent users](https://martinfowler.com/articles/harness-engineering.html) - Martin Fowler article on feedforward, feedback, and outer harnesses for coding agents.
421
+ - 📝 **Blog** [Context Engineering](https://simonwillison.net/2025/Jun/27/context-engineering/) - Simon Willison's framing of context engineering, useful for distinguishing context state from loop orchestration.
422
+ - 📝 **Blog** [Agentic Coding in 2026](https://sourcegraph.com/blog/agentic-coding) - Sourcegraph on supplying deterministic, large-codebase context and code intelligence so recurring agent runs reuse durable repository state instead of rediscovering it each time.
423
+ - 📝 **Blog** [Agentic AI State Management with ScyllaDB and LangGraph](https://www.scylladb.com/2026/04/08/agentic-ai-state-management-with-scylladb-and-langgraph/) - Durable agent state with checkpointers, write-ahead logs, and time-travel branching.
424
+ - 🧰 **Tool** [Mem0](https://github.com/mem0ai/mem0) - Open-source memory layer for retaining user, session, and agent state across repeated agent sessions.
425
+ - 🧰 **Tool** [Letta](https://github.com/letta-ai/letta) - Stateful agent framework from the MemGPT line with persistent, self-editing memory across runs.
426
+ - 🧰 **Tool** [Zep](https://github.com/getzep/zep) - Temporal knowledge graph memory that tracks how facts about users and systems change across sessions.
427
+ - 🧰 **Tool** [LangMem](https://github.com/langchain-ai/langmem) - SDK for extracting, consolidating, and retrieving long-term agent memory between loop runs.
428
+ - 🧰 **Tool** [Beads](https://github.com/steveyegge/beads) - Git-plus-SQLite issue and memory store that agents read and write with a `bd` CLI, giving recurring loops durable task state and progress that survives context resets.
429
+ - 📄 **Paper** [ARC: Active and Reflection-driven Context Management for Long-Horizon Agents](https://arxiv.org/abs/2601.12030) - Treats context as a managed runtime artifact, reorganizing the working context when degradation or context rot is detected across a long run.
430
+
431
+ ## Orchestration And Multi-Agent Delegation
432
+
433
+ - 🧰 **Tool** [AutoGen](https://github.com/microsoft/autogen) - Multi-agent programming framework for conversations, tool use, and orchestration; active development has moved to the Microsoft Agent Framework.
434
+ - 🧰 **Tool** [Microsoft Agent Framework](https://github.com/microsoft/agent-framework) - Microsoft's successor to AutoGen and Semantic Kernel for building and orchestrating multi-agent workflows in Python and .NET.
435
+ - 🧰 **Tool** [LangGraph](https://github.com/langchain-ai/langgraph) - Graph-based framework for controllable agent workflows, persistence, and human-in-the-loop steps.
436
+ - 🧰 **Tool** [CrewAI](https://github.com/crewAIInc/crewAI) - Framework for multi-agent workflows organized around roles, tasks, and crews.
437
+ - 📚 **Docs** [LlamaIndex Workflows](https://developers.llamaindex.ai/python/llamaagents/workflows/) - Event-driven workflow abstraction for agentic applications.
438
+ - 📚 **Docs** [OpenAI Agents SDK handoffs](https://openai.github.io/openai-agents-python/handoffs/) - First-class delegation between specialized agents.
439
+ - 📚 **Docs** [Agent Protocol](https://agentprotocol.ai/) - API protocol for agent interaction, useful for separating loop managers from agent runtimes.
440
+ - 🧰 **Tool** [AgentKit](https://github.com/inngest/agent-kit) - TypeScript toolkit for durable, event-driven agents on workflow infrastructure.
441
+ - 🧰 **Tool** [deepagents](https://github.com/langchain-ai/deepagents) - LangChain project for deeper, longer-running agents with middleware and harness patterns.
442
+ - 📚 **Docs** [Temporal for AI](https://temporal.io/solutions/ai) - Durable execution for long-running agent workflows: crash-proof state, automatic retries, and human-in-the-loop signals.
443
+ - 🧰 **Tool** [Restate](https://restate.dev/) - Durable execution runtime for building resilient, stateful agents and workflows that survive failures mid-loop.
444
+ - 🧰 **Tool** [DBOS](https://www.dbos.dev/) - Lightweight Postgres-backed durable execution library for crash-proof agent workflows, queues, and scheduled triggers.
445
+ - 🧰 **Tool** [Composio Agent Orchestrator](https://github.com/ComposioHQ/agent-orchestrator) - Orchestrates parallel coding agents in isolated worktrees that plan tasks, fix CI failures, respond to reviews, and manage their own PR lifecycle.
446
+
447
+ ## Benchmarks And Evaluation
448
+
449
+ - 🧪 **Benchmark** [SWE-bench](https://www.swebench.com/) - Benchmark for resolving real GitHub issues through code editing and tests.
450
+ - 📄 **Paper** [SWE-bench: Can Language Models Resolve Real-World GitHub Issues?](https://arxiv.org/abs/2310.06770) - Original SWE-bench paper.
451
+ - 📄 **Paper** [SWE-bench Goes Live](https://arxiv.org/abs/2505.23419) - Dynamic benchmark designed to reduce overfitting to static issue sets.
452
+ - 🧪 **Benchmark** [Terminal-Bench](https://www.tbench.ai/) - Benchmark for agents operating in terminal environments.
453
+ - 🧰 **Tool** [Terminal-Bench repository](https://github.com/harbor-framework/terminal-bench) - Open-source benchmark and harness for hard terminal tasks.
454
+ - 📄 **Paper** [AgentBench](https://arxiv.org/abs/2308.03688) - Multi-environment benchmark for evaluating LLMs as agents.
455
+ - 📄 **Paper** [WebArena](https://arxiv.org/abs/2307.13854) - Realistic web environment for autonomous agents.
456
+ - 📄 **Paper** [OSWorld](https://arxiv.org/abs/2404.07972) - Benchmark for multimodal agents operating full computer environments.
457
+ - 📄 **Paper** [ToolBench](https://arxiv.org/abs/2307.16789) - Tool-use benchmark and dataset for tool-augmented agents.
458
+ - 📄 **Paper** [GAIA](https://arxiv.org/abs/2311.12983) - Benchmark for general AI assistants requiring reasoning, tool use, and multi-step work.
459
+ - 📄 **Paper** [Tau-bench](https://arxiv.org/abs/2406.12045) - Benchmark for tool-agent-user interactions in realistic domains.
460
+ - 📄 **Paper** [VisualWebArena](https://arxiv.org/abs/2401.13649) - Visually grounded web-agent benchmark extending WebArena.
461
+ - 📄 **Paper** [AppWorld](https://arxiv.org/abs/2407.18901) - Benchmark of interactive app tasks with state-based and execution-based evaluation.
462
+ - 📄 **Paper** [Vending-Bench](https://arxiv.org/abs/2502.15840) - Benchmark for long-term coherence of autonomous agents; documents how small errors compound over very long loop horizons.
463
+ - 🧪 **Benchmark** [Vending-Bench leaderboard](https://andonlabs.com/evals/vending-bench) - Live long-horizon coherence results from Andon Labs.
464
+ - 📄 **Paper** [SWE-EVO: Benchmarking Coding Agents in Long-Horizon Software Evolution Scenarios](https://arxiv.org/abs/2512.18470) - Release-note-derived evolution tasks where agents score far below isolated-issue benchmarks, quantifying the long-horizon gap loops must manage.
465
+ - 📄 **Paper** [EvoSkills: Self-Evolving Agent Skills via Co-Evolutionary Verification](https://arxiv.org/abs/2604.01687) - A skill generator and a co-evolving surrogate verifier improve multi-file skill packages over iterations, evaluated on the SkillsBench benchmark of structured skill bundles.
466
+ - 📄 **Paper** [SlopCodeBench: Benchmarking How Coding Agents Degrade Over Long-Horizon Iterative Tasks](https://arxiv.org/abs/2603.24755) - Quantifies structural erosion and verbosity creep across iteration checkpoints in native harnesses like Claude Code and Codex, evidence for why loops need verification and budgets.
467
+ - 📄 **Paper** [LongCLI-Bench: A Preliminary Benchmark for Long-horizon Agentic Programming in Command-Line Interfaces](https://arxiv.org/abs/2602.14337) - Long-horizon CLI tasks where most runs stall below 30% completion, mapping where unattended loops break down.
468
+
469
+ ## Operations Playbooks
470
+
471
+ - 📝 **Blog** [Agentic Engineering: The Agent Loop](https://junpingyi.com/books/agentic-engineering/agent-loop/) - Minimal mental model for the loop underlying agent operation.
472
+ - 📝 **Blog** [The agent loop: ReAct, plan-and-execute, reflection](https://www.kunwar.page/chapter/067-the-agent-loop-react-plan-and-execute-reflection) - Practical walkthrough of the base loop and common variants.
473
+ - 📝 **Blog** [How to Build an Agent](https://ampcode.com/how-to-build-an-agent) - Thorsten Ball's demystification of the inner agent loop: a model, a loop, and enough tokens.
474
+ - 📝 **Blog** [Agentic Coding Recommendations](https://lucumr.pocoo.org/2025/6/12/agentic-coding/) - Armin Ronacher's field notes on which practices hold up when agents do most of the work.
475
+ - 📝 **Blog** [Coding Agents 101: The Art of Actually Getting Things Done](https://devin.ai/agents101) - Practical delegation guidance from the Devin team on scoping tasks agents can actually finish.
476
+ - 📝 **Blog** [How Anthropic teams use Claude Code](https://claude.com/blog/how-anthropic-teams-use-claude-code) - Cross-team field report of real recurring agent workflows in engineering, security, and data science.
477
+ - 📝 **Blog** [How Boris Uses Claude Code](https://howborisusesclaudecode.com/) - Unofficial but concrete compilation of Boris Cherny's autonomous setups: parallel worktrees, auto mode, `/loop`, `/schedule`, dynamic workflows, and `/goal` completion conditions.
478
+ - 📝 **Blog** [Agent of the Day: Copilot Agent PR Analysis](https://github.github.com/gh-aw/blog/2026-05-26-agent-of-the-day/) - Official walkthrough of a daily scheduled agentic workflow that ingests PR data, analyzes it, and publishes findings to a Discussion, a concrete recurring loop with trigger, intake, analysis, and output.
479
+
480
+ ## Templates And Patterns
481
+
482
+ Reusable patterns that contributors can turn into future examples, templates, or playbooks.
483
+
484
+ - 🧾 **Template** [Resource entry template](templates/resource-entry.md) - Format for adding a single resource with evidence quality and category fit.
485
+ - 🧾 **Template** [Loop pattern template](templates/loop-pattern.md) - Template for documenting an operational loop such as PR babysitting, CI repair, or feedback clustering.
486
+ - 🧾 **Template** [Loop contract schema](schemas/loop-contract.schema.json) - Machine-readable schema for portable loop specs.
487
+ - 🧾 **Template** [Loop contract preview script](scripts/preview_loop_contract.py) - Dependency-free demo that validates and renders a loop contract JSON file.
488
+ - 🧾 **Template** [Translation guide](TRANSLATIONS.md) - How to add or maintain a language translation without drifting from the canonical English list.
489
+ - 🧾 **Template** [Pattern library index](patterns/README.md) - Practical loop patterns with triggers, state, verification gates, budgets, and escalation paths.
490
+
491
+ Additional loop patterns worth documenting include PR babysitting, CI repair, feedback clustering, deploy verification, and docs drift collection.
492
+
493
+ ## Examples And Schema
494
+
495
+ Concrete examples make the loop contract easier to adapt to real repositories.
496
+
497
+ - 🔁 **Pattern** [Example loop specs](examples/README.md) - Human-readable walkthroughs for PR babysitting, CI repair, and docs drift collection.
498
+ - 🧾 **Template** [Loop contract library](examples/README.md#contract-library) - Schema-validated loop contracts for every pattern-library loop, from PR babysitting to model routing.
499
+ - 🧾 **Template** [Runnable test-repair loop](examples/runnable/test-repair-loop.sh) - Dependency-light reference loop script with a verification gate, retry budget, durable progress log, repeat-failure detection, and escalation exit.
500
+ - 🧾 **Template** [Runnable loop guide](examples/runnable/README.md) - Maps the script line by line to the Loop Contract and shows how to drive it with Claude Code, Codex CLI, or any agent CLI.
501
+
502
+ Preview an example locally:
503
+
504
+ ```sh
505
+ python3 scripts/preview_loop_contract.py examples/pr-babysitter-loop.json
506
+ ```
507
+
508
+ ## Community Gallery
509
+
510
+ The gallery is for real-world or realistic loop examples contributed by the community.
511
+
512
+ **Running a real loop?** Share it, real or anonymized, in the patterns discussion linked under Roadmap And Discussion below. Use the [minimum useful case study](gallery/README.md#minimum-useful-case-study) and [anonymization](gallery/README.md#safe-anonymization-checklist) checklists so others can learn from it safely.
513
+
514
+ - 🧾 **Template** [Loop gallery guide](gallery/README.md) - Quality bar for contributed loop examples with receipts and lessons learned.
515
+ - 🧾 **Template** [Loop gallery template](gallery/template.md) - Markdown template for sharing a loop's trigger, intake, state, verification, escalation, and safety notes.
516
+ - 🔁 **Pattern** [PR babysitter reference loop](gallery/pr-babysitter-reference.md) - Reference gallery entry for keeping a pull request moving.
517
+ - 🔁 **Pattern** [CI repair reference loop](gallery/ci-repair-reference.md) - Reference gallery entry for turning failing CI into a verified patch or escalation.
518
+ - 🔁 **Pattern** [Docs drift reference loop](gallery/docs-drift-reference.md) - Reference gallery entry for recurring docs/code consistency checks.
519
+
520
+ ## Discovery And Distribution
521
+
522
+ This repository includes a lightweight GitHub Pages landing page for search and social previews:
523
+
524
+ - 🧾 **Template** [Landing page](https://chaoyue0307.github.io/awesome-loop-engineering/) - SEO-friendly entry point for the repository.
525
+ - 🧾 **Template** [Landing page source](docs/index.html) - Source for the static landing page.
526
+ - 🧾 **Template** [Sitemap](docs/sitemap.xml) - Crawl hints for the landing page and core repository pages.
527
+ - 🧾 **Template** [Robots file](docs/robots.txt) - Allows indexing and points crawlers to the sitemap.
528
+
529
+ For launch copy and backlink strategy, use the [distribution checklist](meta/DISTRIBUTION.md).
530
+
531
+ ## Roadmap And Discussion
532
+
533
+ - 🧾 **Template** [Roadmap](ROADMAP.md) - Near-term work, pattern priorities, gallery goals, and open questions.
534
+ - 🧾 **Template** [Launch article](posts/launch.md) - Shareable explanation of the concept and repository.
535
+ - 🧾 **Template** [Discussion guide](meta/DISCUSSIONS.md) - Suggested discussion categories, starter prompts, and moderation standard.
536
+ - 🔁 **Pattern** [Show your Loop Engineering patterns](https://github.com/ChaoYue0307/awesome-loop-engineering/discussions/2) - Community discussion for real or anonymized loop examples.
537
+
538
+ ## Pattern Library
539
+
540
+ Practical loop patterns translate the abstract contract into runnable operating models. Each pattern documents the trigger, discover/intake step, agents, workspace, state, verification gates, retry budget, escalation path, and loop instruction.
541
+
542
+ - 🔁 **Pattern** [PR babysitter](patterns/pr-babysitter.md) - Repeatedly checks review comments, CI, merge conflicts, stale threads, and readiness to merge.
543
+ - 🔁 **Pattern** [CI repair loop](patterns/ci-repair-loop.md) - Reproduces failing checks, patches narrowly, reruns evidence, and escalates when failures are outside scope.
544
+ - 🔁 **Pattern** [Docs drift collector](patterns/docs-drift-collector.md) - Finds mismatches between docs and code, proposes small patches, and verifies examples.
545
+ - 🔁 **Pattern** [Deploy verifier](patterns/deploy-verifier.md) - Watches rollout signals, compares them with release expectations, and stops on anomalies.
546
+ - 🔁 **Pattern** [Feedback clusterer](patterns/feedback-clusterer.md) - Periodically groups GitHub, Linear, Slack, support, or social feedback into actionable themes.
547
+ - 🔁 **Pattern** [Dependency triage loop](patterns/dependency-triage-loop.md) - Classifies dependency updates, applies safe groups, verifies them, and escalates risky upgrades.
548
+ - 🔁 **Pattern** [Evaluation regression loop](patterns/evaluation-regression-loop.md) - Investigates degraded agent evals with baseline traces, targeted reruns, and repair proposals.
549
+ - 🔁 **Pattern** [Security review loop](patterns/security-review-loop.md) - Reviews sensitive diffs with evidence-backed findings, safe permissions, and human approval boundaries.
550
+ - 🔁 **Pattern** [Cost-control loop](patterns/cost-control-loop.md) - Monitors agent workflow spend, identifies waste, proposes scoped savings, and preserves quality gates.
551
+ - 🔁 **Pattern** [Bug hunting loop](patterns/bug-hunting-loop.md) - Discovers, reproduces, minimizes, and reports bugs with concrete evidence.
552
+ - 🔁 **Pattern** [Enterprise approval loop](patterns/enterprise-approval-loop.md) - Drives a permissioned change through required gates and approvers with a full audit trail.
553
+ - 🔁 **Pattern** [Incident response loop](patterns/incident-response-loop.md) - Triages an alert into an owned, evidence-backed incident with a postmortem seed.
554
+ - 🔁 **Pattern** [Data-quality loop](patterns/data-quality-loop.md) - Validates each dataset refresh against quality rules and quarantines bad versions.
555
+ - 🔁 **Pattern** [Release-note loop](patterns/release-note-loop.md) - Drafts release notes from merged commits, issues, and PRs with linked evidence.
556
+ - 🔁 **Pattern** [Model-routing loop](patterns/model-routing-loop.md) - Routes tasks across models on measured quality, latency, privacy, and cost.
557
+
558
+ ## Critiques, Risks, And Limitations
559
+
560
+ - ⚠️ **Critique** [Most Developers Do Not Need Agent Loops Yet](https://alphasignalai.substack.com/p/most-developers-do-not-need-agent) - Useful caution against adopting loops before the task, signal, and economics justify them.
561
+ - ⚠️ **Critique** [Engineering Agentic Systems for Reliability](https://pruningmypothos.com/systems/engineering-agentic-systems-for-reliability/) - Cautions that agentic systems fail at boundaries when permissions, verification, traceability, and escalation are weak.
562
+ - ⚠️ **Critique** [Self-Correcting Agents: Reflexion, CRITIC, and ReAct Loops Compared](https://callsphere.ai/blog/self-correcting-agents-reflexion-critic-react-loops-compared-2026) - Compares self-correction patterns and their cost/failure tradeoffs.
563
+ - ⚠️ **Critique** [How to Build an AI Agent Harness: A 2026 Complete Guide](https://atlan.com/know/how-to-build-ai-agent-harness/) - Broad guide with useful warnings on data readiness, permissions, context management, and evaluation.
564
+ - ⚠️ **Critique** [Harness Engineering vs Prompt Engineering vs Context Engineering Explained](https://medium.com/@visrow/harness-engineering-vs-prompt-engineering-vs-context-engineering-explained-0423b692c87d) - Adjacent framing that helps avoid confusing loop engineering with the surrounding harness discipline.
565
+
566
+ ## Adjacent Awesome Lists
567
+
568
+ - 🧭 **List** [Awesome Harness Engineering](https://github.com/ai-boost/awesome-harness-engineering) - Comprehensive list for the agent harness layer that Loop Engineering builds on.
569
+ - 🧭 **List** [Awesome Harness Engineering](https://github.com/walkinglabs/awesome-harness-engineering) - High-signal harness list with strong categories for context, guardrails, specs, evals, runtimes, and benchmarks.
570
+ - 🧭 **List** [Awesome Agent Harness](https://github.com/AutoJunjie/awesome-agent-harness) - Curated tools and resources for environments, constraints, and feedback around coding agents.
571
+ - 🧭 **List** [Awesome Context Engineering](https://github.com/Meirtz/Awesome-Context-Engineering) - Survey-style list for context engineering across LLMs and agents.
572
+ - 🧭 **List** [Awesome Prompt Engineering](https://github.com/promptslab/Awesome-Prompt-Engineering) - Classic adjacent list for prompt techniques and prompting resources.
573
+ - 🧭 **List** [Awesome LLM Agents](https://github.com/kaushikb11/awesome-llm-agents) - General list of LLM agent papers, frameworks, and applications.
574
+ - 🧭 **List** [Awesome AI Agents](https://github.com/e2b-dev/awesome-ai-agents) - Broad AI agent ecosystem map.
575
+ - 🧭 **List** [Awesome CLI Coding Agents](https://github.com/bradAGI/awesome-cli-coding-agents) - Directory of terminal-native coding agents, parallel runners, autonomous loops, and the harnesses that orchestrate them.
576
+ - 🧭 **List** [Awesome Self-Evolving Agents](https://github.com/XMUDeepLIT/Awesome-Self-Evolving-Agents) - Survey-style list of agents that improve themselves over repeated runs, an adjacent angle on long-running loops with memory and verification.
577
+
578
+ ## Contributing
579
+
580
+ Contributions are welcome. Please read [CONTRIBUTING.md](CONTRIBUTING.md) before opening a pull request.
581
+
582
+ This repository uses a strict [curation standard](meta/CURATION.md) to keep the list focused, verifiable, and useful for builders. Maintainers can use the [maintenance guide](meta/MAINTENANCE.md) for link checks, identity checks, and periodic refreshes.
583
+
584
+ For community expectations and support channels, see [CODE_OF_CONDUCT.md](CODE_OF_CONDUCT.md), [SUPPORT.md](SUPPORT.md), and [SECURITY.md](SECURITY.md).
585
+
586
+ Fast path for adding a resource:
587
+
588
+ - Check that it is about AI/coding-agent Loop Engineering or a direct foundation for it.
589
+ - Search the README to avoid duplicates.
590
+ - Pick the most specific category.
591
+ - Add one entry using this format:
592
+
593
+ ```md
594
+ - 📄 **Paper** [Title](https://example.com) - One sentence explaining the resource's contribution to Loop Engineering.
595
+ ```
596
+
597
+ - Open a pull request and explain the category fit, source type, and why builders should care.
598
+
599
+ Fast path for contributing a loop pattern: start from the loop pattern template or loop contract schema, include trigger, discover/intake, delegation, workspace, context, verification, durable state, budget, escalation, and exit, then open a pattern suggestion issue if you want feedback before writing the full pattern.
600
+
601
+ Good submissions should answer three questions:
602
+
603
+ 1. Is this about the new AI/coding-agent meaning of Loop Engineering or a direct foundation for it?
604
+ 2. Does it help someone design, run, verify, evaluate, or critique recurring agent systems that coordinate prompting, context, harnesses, verification, and state?
605
+ 3. Is the source stable, public, and specific enough to be useful?
606
+
607
+ ## Citation
608
+
609
+ If this repository is useful in your work, please cite it with:
610
+
611
+ ```bibtex
612
+ @misc{chaoyue2026awesome_loop_engineering,
613
+ author = {He, Chaoyue},
614
+ title = {Awesome Loop Engineering},
615
+ year = {2026},
616
+ howpublished = {\url{https://github.com/ChaoYue0307/awesome-loop-engineering}},
617
+ note = {Curated resources for Loop Engineering}
618
+ }
619
+ ```
620
+
621
+ **Reusable blurb** (for blog posts, talks, internal docs, or community posts):
622
+
623
+ > Loop Engineering is the practice of designing recurring AI-agent and coding-agent systems that discover work, delegate to agents, verify results, persist state, and retry or escalate on a cadence or until a goal is reached. *Awesome Loop Engineering* is a curated, implementation-focused resource collection for this practice: [github.com/ChaoYue0307/awesome-loop-engineering](https://github.com/ChaoYue0307/awesome-loop-engineering)
README.pt-BR.md ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Awesome Loop Engineering
2
+
3
+ <!-- last-synced: 2026-06-11 -->
4
+
5
+ <p align="center">
6
+ <img src="assets/awesome-loop-engineering-cover.png" alt="Awesome Loop Engineering cover" width="100%">
7
+ </p>
8
+
9
+ <p align="center">
10
+ <a href="README.md">English</a> |
11
+ <a href="README.zh-CN.md">中文</a> |
12
+ <a href="README.es.md">Español</a> |
13
+ <a href="README.fr.md">Français</a> |
14
+ <a href="README.de.md">Deutsch</a> |
15
+ <a href="README.ja.md">日本語</a> |
16
+ <a href="README.ko.md">한국어</a> |
17
+ <a href="README.pt-BR.md">Português</a> |
18
+ <a href="TRANSLATIONS.md">Ajudar a traduzir</a>
19
+ </p>
20
+
21
+ > Uma lista curada e orientada à implementação para **Loop Engineering**: a camada acima de prompt, context e harness engineering para projetar sistemas recorrentes de agentes de IA.
22
+
23
+ Prompt engineering melhora o que você pede ao modelo. Context engineering melhora o que o modelo consegue ver. Harness engineering melhora ferramentas, permissões, sandboxes e verificações ao redor de uma execução de agente. **Loop Engineering fica acima das três**: projeta sistemas que acionam agentes, supervisionam, verificam resultados, persistem estado e executam novamente.
24
+
25
+ Um loop descobre trabalho, delega para um ou mais agentes, verifica o resultado, registra estado, decide a próxima ação e executa novamente em uma cadência ou até atingir um objetivo verificável.
26
+
27
+ Este repositório trata do novo significado de Loop Engineering no contexto de AI agents e coding agents. Ele não trata de event loops de software, teoria de controle, growth loops, automação genérica ou feedback loops não relacionados a IA.
28
+
29
+ ## Modelo Mental
30
+
31
+ - Prompt engineering pergunta: o que devo dizer ao modelo?
32
+ - Context engineering pergunta: que estado e conhecimento o modelo deve ver?
33
+ - Harness engineering pergunta: quais ferramentas, permissões, testes, sandboxes e feedback devem cercar o agente?
34
+ - Loop engineering pergunta: que sistema recorrente deve descobrir trabalho, delegar para agentes, verificar resultados, persistir estado, decidir próximas ações e rodar de novo?
35
+
36
+ Prompt, context e harness engineering melhoram uma execução. Loop Engineering torna o trabalho de agentes repetível, observável e governável ao longo do tempo.
37
+
38
+ ## Loop Contract
39
+
40
+ Um loop útil normalmente precisa deixar estes elementos visíveis:
41
+
42
+ | Parte | Pergunta de design | Artefato comum |
43
+ | ----------------- | ------------------------------------------ | ---------------------------------------------------------- |
44
+ | Objective | O que o loop deve otimizar? | Goal, issue, PRD, runbook |
45
+ | Trigger | Quando o loop roda? | Schedule, webhook, `/loop`, `/goal`, automation |
46
+ | Discover / Intake | Como o loop encontra trabalho? | GitHub query, Linear filter, CI failure, feedback stream |
47
+ | Workspace | Onde o agente pode agir com segurança? | Worktree, sandbox, branch, container |
48
+ | Context | Que conhecimento durável deve carregar? | `AGENTS.md`, `CLAUDE.md`, `SKILL.md`, docs |
49
+ | Delegation | Qual agente faz qual parte? | Explorer, implementer, reviewer, judge |
50
+ | Verification | O que decide sucesso ou falha? | Tests, typecheck, lint, evals, trace graders |
51
+ | State | O que sobrevive para a próxima execução? | Progress file, checkpoint, trace, issue comment |
52
+ | Budget | Quando deve parar de gastar? | Max turns, max retries, token budget, time box |
53
+ | Escalation | Quando uma pessoa assume? | PR, issue, Slack alert, triage inbox |
54
+ | Exit | Como o loop sabe que terminou? | Acceptance criteria, passing checks, no work found |
55
+
56
+ ## Modelo de Maturidade
57
+
58
+ | Nível | Nome | Descrição |
59
+ | ----- | -------------------------- | ---------------------------------------------------------------------------------------- |
60
+ | 0 | Manual prompting | Uma pessoa lê o estado e escreve o próximo prompt. |
61
+ | 1 | Scripted retry | Um script devolve erros ao agente. |
62
+ | 2 | Scheduled loop | O agente roda em uma cadência e reporta resultados. |
63
+ | 3 | Stateful loop | O progresso sobrevive por arquivos, issues, checkpoints ou traces. |
64
+ | 4 | Self-verifying loop | Checks determinísticos ou evaluator agents bloqueiam conclusões erradas. |
65
+ | 5 | Multi-agent loop | Agentes especializados dividem discovery, implementation, review e judgment. |
66
+ | 6 | Production-supervised loop | Observabilidade, budgets, approvals, rollback e escalonamento humano são centrais. |
67
+
68
+ ## Primeiras Leituras
69
+
70
+ A lista completa de recursos fica no README canônico em inglês: [README.md](README.md).
71
+
72
+ Leituras recomendadas:
73
+
74
+ - [Loop Engineering](https://addyosmani.com/blog/loop-engineering/) - Define a mudança de prompting manual para sistemas que promptam, verificam e continuam.
75
+ - [Run long horizon tasks with Codex](https://developers.openai.com/blog/run-long-horizon-tasks-with-codex) - Runbook prático para plan-edit-test-observe-repair-document-repeat.
76
+ - [Run prompts on a schedule](https://code.claude.com/docs/en/scheduled-tasks) - Mecânica oficial para `/loop`, scheduled tasks e prompts recorrentes.
77
+ - [Building Effective Agents](https://www.anthropic.com/engineering/building-effective-agents) - Patterns componíveis para workflows e agentes.
78
+
79
+ ## Contribuir
80
+
81
+ Contribuições são bem-vindas. Leia [CONTRIBUTING.md](CONTRIBUTING.md) antes de abrir um pull request.
82
+
83
+ Fluxo rápido:
84
+
85
+ 1. Confirme que o recurso trata de Loop Engineering para AI/coding agents ou de uma base direta para isso.
86
+ 1. Pesquise no README para evitar duplicatas.
87
+ 1. Escolha a categoria mais específica.
88
+ 1. Adicione uma entrada neste formato:
89
+
90
+ ```md
91
+ - 📄 **Paper** [Title](https://example.com) - One sentence explaining the resource's contribution to Loop Engineering.
92
+ ```
93
+
94
+ 1. Explique no PR a relevância, a categoria, o tipo de recurso e por que ele ajuda builders.
95
+
96
+ ## Traduções
97
+
98
+ Para manter ou adicionar um idioma, leia [TRANSLATIONS.md](TRANSLATIONS.md). As traduções devem preservar o escopo estreito: não incluir event loops, growth loops ou automação genérica.
README.zh-CN.md ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Awesome Loop Engineering
2
+
3
+ <!-- last-synced: 2026-06-11 -->
4
+
5
+ <p align="center">
6
+ <img src="assets/awesome-loop-engineering-cover.png" alt="Awesome Loop Engineering cover" width="100%">
7
+ </p>
8
+
9
+ <p align="center">
10
+ <a href="README.md">English</a> |
11
+ <a href="README.zh-CN.md">中文</a> |
12
+ <a href="README.es.md">Español</a> |
13
+ <a href="README.fr.md">Français</a> |
14
+ <a href="README.de.md">Deutsch</a> |
15
+ <a href="README.ja.md">日本語</a> |
16
+ <a href="README.ko.md">한국어</a> |
17
+ <a href="README.pt-BR.md">Português</a> |
18
+ <a href="TRANSLATIONS.md">帮助翻译</a>
19
+ </p>
20
+
21
+ > 面向 **Loop Engineering** 的精选资源列表:它位于 prompt、context 和 harness engineering 之上,关注如何设计可重复运行的 AI-agent 系统。
22
+
23
+ Prompt engineering 改进你对模型说什么。Context engineering 改进模型能看到什么。Harness engineering 改进单次 agent 运行周围的工具、权限、沙箱和检查。**Loop Engineering 位于三者之上**:人不再逐轮手动提示 agent,而是设计一个循环系统,让它负责提示、监督、验证、更新状态并再次触发 agents。
24
+
25
+ 一个 loop 会发现工作、分派给一个或多个 agents、检查结果、记录状态、决定下一步,并按照节奏或直到满足可验证目标为止持续运行。
26
+
27
+ 本仓库不收录软件事件循环、控制论、增长循环、通用 workflow automation 或非 AI feedback loop。
28
+
29
+ ## 一句话定位
30
+
31
+ - Prompt engineering 关注:我应该对模型说什么?
32
+ - Context engineering 关注:模型应该看到什么状态和知识?
33
+ - Harness engineering 关注:agent 周围应该有什么工具、权限、测试、沙箱和反馈?
34
+ - Loop engineering 关注:当人不在内循环里时,什么系统负责发现工作、分派给 agents、验证结果、持久化状态、决定下一步并重新运行?
35
+
36
+ Prompt、context 和 harness engineering 让单次 agent 运行更好。Loop Engineering 让 agent 工作能跨时间重复、观察和治理。
37
+
38
+ ## Loop Contract
39
+
40
+ 一个有效的 loop 通常需要这些部分:
41
+
42
+ | 部分 | 设计问题 | 常见产物 |
43
+ | ----------------- | -------------- | ----------------------------------------------------- |
44
+ | Objective | loop 要优化什么? | goal、issue、PRD、runbook |
45
+ | Trigger | 什么时候运行? | schedule、webhook、`/loop`、`/goal`、automation |
46
+ | Discover / Intake | 如何发现工作? | GitHub query、Linear filter、CI failure、feedback stream |
47
+ | Workspace | agent 在哪里安全行动? | worktree、sandbox、branch、container |
48
+ | Context | 哪些知识应该长期存在? | `AGENTS.md`、`CLAUDE.md`、`SKILL.md`、docs |
49
+ | Delegation | 哪个 agent 负责什么? | explorer、implementer、reviewer、judge |
50
+ | Verification | 什么机制判断通过或失败? | tests、typecheck、lint、evals、trace graders |
51
+ | State | 下一轮需要保留什么? | progress file、checkpoint、trace、issue comment |
52
+ | Budget | 何时停止消耗? | max turns、max retries、token budget、time box |
53
+ | Escalation | 何时交给人? | PR、issue、Slack alert、triage inbox |
54
+ | Exit | loop 如何知道完成? | acceptance criteria、passing checks、no work found |
55
+
56
+ ## 成熟度模型
57
+
58
+ | 等级 | 名称 | 描述 |
59
+ | --- | -------------------------- | --------------------------------------------------------------- |
60
+ | 0 | Manual prompting | 人读取状态并写下一条 prompt。 |
61
+ | 1 | Scripted retry | 脚本把错误反馈给 agent。 |
62
+ | 2 | Scheduled loop | agent 按固定节奏运行并报告结果。 |
63
+ | 3 | Stateful loop | 通过文件、issue、checkpoint 或 trace 保留进度。 |
64
+ | 4 | Self-verifying loop | 用确定性检查或 evaluator agent 阻止错误完成。 |
65
+ | 5 | Multi-agent loop | discovery、implementation、review、judgment 由不同 agents 分工。 |
66
+ | 6 | Production-supervised loop | observability、budget、approval、rollback、human escalation 都是一等公民。 |
67
+
68
+ ## 必读入口
69
+
70
+ 完整资源列表以英文 README 为准:[README.md](README.md)。
71
+
72
+ 建议从这些直接讨论 Loop Engineering 的资料开始:
73
+
74
+ - [Loop Engineering](https://addyosmani.com/blog/loop-engineering/) - Addy Osmani 对 Loop Engineering 的核心定义和 Codex / Claude Code primitives 对照。
75
+ - [Loop Engineering](https://addyo.substack.com/p/loop-engineering) - 同文 Substack 版本,包含 Peter Steinberger 和 Boris Cherny 的相关引用。
76
+ - [Loop Engineering](https://cobusgreyling.substack.com/p/loop-engineering) - 简明解释从 prompt agents 到 design loops 的转变。
77
+ - [Loop Engineering: The Guide for AI Agents](https://lushbinary.com/blog/loop-engineering-ai-coding-agents-guide/) - 面向实践的 guide,拆解 automations、worktrees、skills、connectors、subagents 和 state。
78
+ - [Codex Loops: What Boris Cherny Gets Right About Managing Agent Work](https://www.developersdigest.tech/blog/codex-loops-boris-cherny-agent-routines) - 关于 PR babysitting、CI repair、deploy verification 和 feedback clustering 的 loop 思路。
79
+
80
+ ## 如何贡献内容
81
+
82
+ 欢迎提交 PR。请先阅读 [CONTRIBUTING.md](CONTRIBUTING.md)。
83
+
84
+ 最快流程:
85
+
86
+ 1. 确认资源属于 AI/coding-agent 语境的 Loop Engineering,或是它的直接基础。
87
+ 1. 在 README 中搜索,避免重复。
88
+ 1. 选择最具体的分类。
89
+ 1. 按这个格式添加一行:
90
+
91
+ ```md
92
+ - 📄 **Paper** [Title](https://example.com) - One sentence explaining the resource's contribution to Loop Engineering.
93
+ ```
94
+
95
+ 1. 在 PR 中说明:为什么相关、属于哪个分类、资源类型是什么、为什么对 builders 有用。
96
+
97
+ ## 翻译
98
+
99
+ 如果你想维护新的语言版本,请阅读 [TRANSLATIONS.md](TRANSLATIONS.md)。翻译应该保留概念边界:不要把 event loop、growth loop 或普通 automation 翻译进来。
100
+
101
+ ## 许可证
102
+
103
+ 本仓库中的原创整理文字、注释、模板、模式文档和仓库元数据使用 [CC0-1.0](LICENSE) 发布。
104
+
105
+ 本仓库链接到的第三方论文、博客、文档、工具、benchmark、图片和其他外部资源仍遵循其原作者或发布方各自的许可证和使用条款。本仓库只是索引和链接它们,并不重新授权这些外部内容。
ROADMAP.md ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Roadmap
2
+
3
+ This roadmap keeps Awesome Loop Engineering focused on useful, verifiable work for an emerging practice.
4
+
5
+ ## Near Term
6
+
7
+ - Collect more direct Loop Engineering sources as the term stabilizes.
8
+ - Add real or anonymized gallery entries from practitioners running recurring agent loops.
9
+ - Grow the runnable loop directory beyond the test-repair reference loop, including scheduled-trigger variants per runtime.
10
+ - Add more translations for the introduction, mental model, Loop Contract, and contribution guide.
11
+ - Continue replacing weak or unstable links with primary sources, official docs, papers, and implementation-heavy write-ups.
12
+
13
+ ## Pattern Library
14
+
15
+ Completed reference patterns now cover PR babysitting, CI repair, docs drift, deploy verification, feedback clustering, dependency triage, evaluation regression, security review, cost-control, and bug hunting. Every pattern now ships a schema-validated loop contract in `examples/`.
16
+
17
+ Next pattern-library work should focus on variants backed by operational evidence:
18
+
19
+ - enterprise approval loops for permissioned agents;
20
+ - incident response loops with pager handoff and postmortem evidence;
21
+ - data-quality loops for repeated dataset or knowledge-base refresh;
22
+ - release-note loops that connect commits, issues, docs, and changelogs;
23
+ - model-routing loops that balance quality, latency, privacy, and cost.
24
+
25
+ ## Gallery
26
+
27
+ The gallery should grow from reference examples into public or anonymized case studies. Good entries should include:
28
+
29
+ - the runtime or agent tool used;
30
+ - trigger and intake source;
31
+ - verification gates;
32
+ - durable state artifact;
33
+ - budget and escalation rules;
34
+ - receipts or anonymized evidence;
35
+ - lessons learned after real use.
36
+
37
+ ## Quality And Governance
38
+
39
+ - Keep CI dependency-light and easy for contributors to run locally.
40
+ - Keep all resource annotations tied to recurring agent systems, not generic AI-agent interest.
41
+ - Keep public claims conservative: this repository is an early curated field guide, not a finished standard.
42
+ - Preserve clean owner-only commit identity for `main`.
43
+
44
+ ## Open Questions
45
+
46
+ - Which loop primitives become common across Codex, Claude Code, GitHub Agentic Workflows, and custom runtimes?
47
+ - What is the right schema shape for portable loop contracts?
48
+ - Which verification gates are strong enough for unattended or semi-attended loops?
49
+ - How should maintainers evaluate submitted real-world loop examples without exposing private data?
SECURITY.md ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Security Policy
2
+
3
+ This repository is a curated documentation and resource list. It does not ship a production service, package, or runtime. Security concerns can still appear in examples, scripts, links, or contribution material.
4
+
5
+ ## Please Report
6
+
7
+ - A linked resource that appears malicious or impersonates another project.
8
+ - A script or example that could cause unsafe actions if copied directly.
9
+ - Accidentally committed credentials, tokens, private URLs, or sensitive data.
10
+ - Guidance that could encourage unsafe production autonomy without approvals or escalation.
11
+
12
+ ## How To Report
13
+
14
+ Open a private security advisory if GitHub offers that option for this repository. If not, open an issue with sensitive details removed and ask for a maintainer response.
15
+
16
+ Do not post secrets, private customer data, exploit details, or internal URLs in public issues or pull requests.
17
+
18
+ ## Security Review Standard
19
+
20
+ Loop Engineering examples should be conservative:
21
+
22
+ - sensitive actions require human approval;
23
+ - production actions should be read-only by default unless explicitly scoped;
24
+ - credentials and secrets must never be included in examples;
25
+ - loops should have retry budgets, exit conditions, and escalation paths;
26
+ - verification should rely on concrete evidence, not only model self-assessment.
SUPPORT.md ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Support
2
+
3
+ This repository is maintained as a public field guide and curated resource list for Loop Engineering.
4
+
5
+ ## Best Channels
6
+
7
+ - **Resource suggestions**: use the resource suggestion issue template.
8
+ - **Loop patterns**: use the loop pattern suggestion issue template or the pinned community pattern issue.
9
+ - **Corrections**: open a pull request when the fix is clear, or open an issue if it needs discussion.
10
+ - **Translations**: use the translation proposal issue template and follow `TRANSLATIONS.md`.
11
+ - **Security concerns**: follow `SECURITY.md`.
12
+
13
+ ## What Maintainers Can Help With
14
+
15
+ - deciding whether a resource fits the narrow AI/coding-agent meaning of Loop Engineering;
16
+ - improving annotations, categories, and source quality;
17
+ - reviewing loop pattern contracts for trigger, intake, verification, state, budget, escalation, and exit;
18
+ - fixing broken links or replacing unstable sources.
19
+
20
+ ## What Is Out Of Scope
21
+
22
+ - product support for third-party agent tools;
23
+ - private consulting on proprietary loops;
24
+ - generic prompt engineering questions with no loop, state, verification, or recurring system angle;
25
+ - unrelated software event loops, growth loops, control theory loops, or generic automation.
TAXONOMY.md ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Loop Engineering Taxonomy
2
+
3
+ This taxonomy gives contributors a shared vocabulary for classifying AI-agent loops.
4
+
5
+ ## By Trigger
6
+
7
+ - **Scheduled loop**: runs on a cadence such as hourly, daily, weekly, or during a rollout window.
8
+ - **Event-triggered loop**: starts from a webhook, failed check, new comment, issue label, release event, or alert.
9
+ - **Goal-driven loop**: continues until a verifiable goal is met, such as passing tests or resolving all blocking comments.
10
+ - **Manual bootstrap loop**: starts from a human command, then follows a repeatable contract with state, verification, and exit rules.
11
+
12
+ ## By Work Intake
13
+
14
+ - **Queue loop**: consumes work from issues, PRs, tickets, alerts, feedback streams, or triage inboxes.
15
+ - **Scan loop**: periodically searches a repository, dashboard, logs, docs, or benchmark output for new work.
16
+ - **Reactive loop**: responds to a specific failure signal such as CI, eval regression, deploy anomaly, or user report.
17
+
18
+ ## By Verification
19
+
20
+ - **Deterministic loop**: uses tests, typechecks, lint, schemas, dashboards, or threshold checks as the main gate.
21
+ - **Evaluator loop**: uses a second model, rubric, reviewer, or judge agent to evaluate output.
22
+ - **Human-supervised loop**: requires human approval before sensitive actions or before completion is accepted.
23
+ - **Receipt-based loop**: records evidence such as commands, logs, trace IDs, screenshots, PR links, or issue comments.
24
+
25
+ ## By State Model
26
+
27
+ - **Stateless retry loop**: feeds immediate failure evidence back into one session. Useful but fragile.
28
+ - **File-backed loop**: stores progress in `PROGRESS.md`, task files, runbooks, or generated reports.
29
+ - **Issue-backed loop**: stores progress in GitHub, Linear, Jira, Slack, or another system of record.
30
+ - **Checkpointed loop**: persists structured state in a database, workflow engine, trace store, or event log.
31
+
32
+ ## By Agent Topology
33
+
34
+ - **Single-agent loop**: one agent acts, with deterministic checks or human review.
35
+ - **Maker-checker loop**: one agent changes the artifact and another verifies it.
36
+ - **Manager-worker loop**: an orchestrator decomposes work and assigns specialized agents.
37
+ - **Adversarial loop**: reviewer, critic, or security agents try to falsify the maker's output.
38
+
39
+ ## By Operating Domain
40
+
41
+ - **Repository loop**: PR babysitting, CI repair, bug hunting, docs drift, dependency triage.
42
+ - **Release loop**: deploy verification, canary monitoring, rollback recommendation, incident handoff.
43
+ - **Feedback loop**: user feedback clustering, issue deduplication, community triage, roadmap signal collection.
44
+ - **Evaluation loop**: recurring benchmark runs, trace review, regression detection, prompt or harness hill-climbing.
45
+
46
+ ## Maturity Path
47
+
48
+ Most teams should move in this order:
49
+
50
+ 1. Manual bootstrap loop with explicit state.
51
+ 1. Scheduled or event-triggered loop with deterministic gates.
52
+ 1. Maker-checker loop with durable receipts.
53
+ 1. Multi-agent or workflow-backed loop.
54
+ 1. Production-supervised loop with observability, approvals, budgets, and rollback rules.
55
+
56
+ Higher maturity is not automatically better. The right loop is the simplest loop that can safely discover work, delegate, verify, persist state, decide the next action, and stop.
TRANSLATIONS.md ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Translations
2
+
3
+ The canonical list is [README.md](README.md). Translations should help more readers understand Loop Engineering without drifting from the repository's scope.
4
+
5
+ ## Available
6
+
7
+ - [English](README.md)
8
+ - [中文](README.zh-CN.md)
9
+ - [Español](README.es.md)
10
+ - [Français](README.fr.md)
11
+ - [Deutsch](README.de.md)
12
+ - [日本語](README.ja.md)
13
+ - [한국어](README.ko.md)
14
+ - [Português](README.pt-BR.md)
15
+
16
+ ## Wanted
17
+
18
+ Maintainers and contributors are welcome for:
19
+
20
+ - Русский
21
+ - Italiano
22
+ - العربية
23
+ - हिन्दी
24
+
25
+ ## Translation Rules
26
+
27
+ - Preserve the narrow definition: AI/coding-agent Loop Engineering as the layer above prompt, context, and harness engineering.
28
+ - Do not translate unrelated meanings into scope: event loops, control theory, growth loops, generic automation, or non-AI feedback loops.
29
+ - Keep the English README as the source of truth for the full resource list.
30
+ - Prefer translating the introduction, mental model, Loop Contract, maturity model, and contribution instructions first.
31
+ - If you translate the full resource list, keep URLs unchanged and translate only annotations.
32
+ - Add yourself as a translation maintainer in your PR if you can help keep the file current.
33
+ - Every translation carries a `<!-- last-synced: YYYY-MM-DD -->` marker near the top. When you review a translation against the current English README, bump the date. CI fails when a marker is missing or older than 180 days.
34
+
35
+ ## Suggested File Names
36
+
37
+ - `README.de.md`
38
+ - `README.es.md`
39
+ - `README.fr.md`
40
+ - `README.ja.md`
41
+ - `README.ko.md`
42
+ - `README.pt-BR.md`
43
+ - `README.ru.md`
44
+
45
+ ## Translation PR Checklist
46
+
47
+ - [ ] The translation links back to the canonical English README.
48
+ - [ ] The language switcher has been updated in `README.md`.
49
+ - [ ] The `<!-- last-synced: YYYY-MM-DD -->` marker is present and current.
50
+ - [ ] The translation preserves the scope boundary.
51
+ - [ ] Resource URLs are unchanged.
52
+ - [ ] Technical terms are translated consistently or left in English where that is clearer.
assets/README.md ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ # Assets
2
+
3
+ This directory contains visual assets used by the repository README, GitHub Pages landing page, and social previews.
4
+
5
+ - `awesome-loop-engineering-cover.png` - Wide social and README cover image. It visualizes the Prompt, Context, Harness, and Loop stack.
6
+ - `loop-engineering-stack.svg` - Lightweight stack diagram showing how Loop Engineering sits above prompt, context, and harness engineering.
7
+ - `loop-contract-cards.svg` - Visual card grid for the Loop Contract: objective, trigger, intake, workspace, context, delegation, verification, state, budget, escalation, and exit.
8
+ - `loop-lifecycle.svg` - One pass of a recurring loop: Intake, Delegate, Act, Verify, Persist, and Decide, where Decide retries, escalates, or exits.
9
+
10
+ Please keep assets lightweight and directly useful for repository presentation. Avoid adding screenshots or large generated files unless they improve the README or documentation experience.
assets/awesome-loop-engineering-cover.png ADDED

Git LFS Details

  • SHA256: acd8e211f411d336d27eacc80ed358effc3360e1dcf16e84c1b354778ec528b0
  • Pointer size: 131 Bytes
  • Size of remote file: 866 kB
assets/loop-contract-cards.svg ADDED
assets/loop-engineering-stack.svg ADDED
assets/loop-lifecycle.svg ADDED
docs/.nojekyll ADDED
@@ -0,0 +1 @@
 
 
1
+
docs/index.html ADDED
@@ -0,0 +1,293 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <!doctype html>
2
+ <html lang="en">
3
+ <head>
4
+ <meta charset="utf-8">
5
+ <meta name="viewport" content="width=device-width, initial-scale=1">
6
+ <title>Awesome Loop Engineering</title>
7
+ <meta name="description" content="A curated field guide to Loop Engineering: designing recurring AI-agent systems above prompt, context, and harness engineering.">
8
+ <meta name="robots" content="index,follow">
9
+ <link rel="canonical" href="https://chaoyue0307.github.io/awesome-loop-engineering/">
10
+ <meta property="og:type" content="website">
11
+ <meta property="og:title" content="Awesome Loop Engineering">
12
+ <meta property="og:description" content="Curated resources, patterns, examples, schema, and field guides for recurring AI-agent systems.">
13
+ <meta property="og:url" content="https://chaoyue0307.github.io/awesome-loop-engineering/">
14
+ <meta property="og:image" content="https://raw.githubusercontent.com/ChaoYue0307/awesome-loop-engineering/main/assets/awesome-loop-engineering-cover.png">
15
+ <meta name="twitter:card" content="summary_large_image">
16
+ <meta name="twitter:title" content="Awesome Loop Engineering">
17
+ <meta name="twitter:description" content="A field guide for designing recurring AI-agent systems above prompt, context, and harness engineering.">
18
+ <meta name="twitter:image" content="https://raw.githubusercontent.com/ChaoYue0307/awesome-loop-engineering/main/assets/awesome-loop-engineering-cover.png">
19
+ <style>
20
+ :root {
21
+ color-scheme: dark;
22
+ --bg: #0f172a;
23
+ --panel: #111827;
24
+ --muted: #cbd5e1;
25
+ --text: #f8fafc;
26
+ --accent: #38bdf8;
27
+ --accent-2: #a78bfa;
28
+ --border: rgba(148, 163, 184, 0.24);
29
+ }
30
+ * {
31
+ box-sizing: border-box;
32
+ }
33
+ body {
34
+ margin: 0;
35
+ background:
36
+ radial-gradient(circle at 10% 0%, rgba(56, 189, 248, 0.22), transparent 26rem),
37
+ radial-gradient(circle at 90% 10%, rgba(167, 139, 250, 0.2), transparent 28rem),
38
+ var(--bg);
39
+ color: var(--text);
40
+ font-family: Inter, ui-sans-serif, system-ui, -apple-system, BlinkMacSystemFont, "Segoe UI", sans-serif;
41
+ line-height: 1.6;
42
+ }
43
+ a {
44
+ color: #7dd3fc;
45
+ text-decoration: none;
46
+ }
47
+ a:hover {
48
+ text-decoration: underline;
49
+ }
50
+ main {
51
+ width: min(1120px, calc(100% - 32px));
52
+ margin: 0 auto;
53
+ padding: 48px 0 72px;
54
+ }
55
+ .hero {
56
+ display: grid;
57
+ gap: 28px;
58
+ grid-template-columns: minmax(0, 1.1fr) minmax(280px, 0.9fr);
59
+ align-items: center;
60
+ }
61
+ .eyebrow {
62
+ color: var(--accent);
63
+ font-size: 0.82rem;
64
+ font-weight: 800;
65
+ letter-spacing: 0.14em;
66
+ text-transform: uppercase;
67
+ }
68
+ h1 {
69
+ margin: 10px 0 18px;
70
+ font-size: clamp(2.4rem, 6vw, 5.4rem);
71
+ line-height: 0.95;
72
+ letter-spacing: -0.055em;
73
+ }
74
+ .lead {
75
+ max-width: 760px;
76
+ color: var(--muted);
77
+ font-size: clamp(1.08rem, 2vw, 1.3rem);
78
+ }
79
+ .actions {
80
+ display: flex;
81
+ flex-wrap: wrap;
82
+ gap: 12px;
83
+ margin-top: 28px;
84
+ }
85
+ .button {
86
+ border: 1px solid var(--border);
87
+ border-radius: 999px;
88
+ padding: 11px 18px;
89
+ background: rgba(15, 23, 42, 0.72);
90
+ color: var(--text);
91
+ font-weight: 700;
92
+ }
93
+ .button.primary {
94
+ border-color: transparent;
95
+ background: linear-gradient(90deg, var(--accent), var(--accent-2));
96
+ color: #08111f;
97
+ }
98
+ .visual {
99
+ border: 1px solid var(--border);
100
+ border-radius: 28px;
101
+ overflow: hidden;
102
+ background: rgba(17, 24, 39, 0.74);
103
+ box-shadow: 0 24px 80px rgba(0, 0, 0, 0.28);
104
+ }
105
+ .visual img {
106
+ display: block;
107
+ width: 100%;
108
+ }
109
+ .wide-visual {
110
+ border: 1px solid var(--border);
111
+ border-radius: 28px;
112
+ overflow: hidden;
113
+ background: rgba(17, 24, 39, 0.72);
114
+ box-shadow: 0 24px 80px rgba(0, 0, 0, 0.24);
115
+ }
116
+ .wide-visual img {
117
+ display: block;
118
+ width: 100%;
119
+ }
120
+ .section {
121
+ margin-top: 56px;
122
+ }
123
+ .grid {
124
+ display: grid;
125
+ gap: 16px;
126
+ grid-template-columns: repeat(3, minmax(0, 1fr));
127
+ }
128
+ .card {
129
+ min-height: 100%;
130
+ border: 1px solid var(--border);
131
+ border-radius: 22px;
132
+ padding: 22px;
133
+ background: rgba(17, 24, 39, 0.72);
134
+ }
135
+ .card h2,
136
+ .card h3 {
137
+ margin: 0 0 10px;
138
+ line-height: 1.2;
139
+ }
140
+ .card p,
141
+ .card li {
142
+ color: var(--muted);
143
+ }
144
+ .stack {
145
+ display: grid;
146
+ gap: 12px;
147
+ }
148
+ .layer {
149
+ border: 1px solid var(--border);
150
+ border-radius: 18px;
151
+ padding: 16px 18px;
152
+ background: rgba(15, 23, 42, 0.76);
153
+ }
154
+ .layer strong {
155
+ color: var(--text);
156
+ }
157
+ .definition {
158
+ border-left: 4px solid var(--accent);
159
+ padding: 18px 22px;
160
+ border-radius: 16px;
161
+ background: rgba(15, 23, 42, 0.76);
162
+ color: var(--muted);
163
+ }
164
+ footer {
165
+ margin-top: 64px;
166
+ color: #94a3b8;
167
+ font-size: 0.95rem;
168
+ }
169
+ @media (max-width: 850px) {
170
+ .hero,
171
+ .grid {
172
+ grid-template-columns: 1fr;
173
+ }
174
+ main {
175
+ padding-top: 28px;
176
+ }
177
+ }
178
+ </style>
179
+ <script type="application/ld+json">
180
+ {
181
+ "@context": "https://schema.org",
182
+ "@type": "CollectionPage",
183
+ "name": "Awesome Loop Engineering",
184
+ "url": "https://chaoyue0307.github.io/awesome-loop-engineering/",
185
+ "description": "A curated field guide to Loop Engineering: designing recurring AI-agent systems above prompt, context, and harness engineering.",
186
+ "isPartOf": {
187
+ "@type": "WebSite",
188
+ "name": "Awesome Loop Engineering",
189
+ "url": "https://github.com/ChaoYue0307/awesome-loop-engineering"
190
+ },
191
+ "about": [
192
+ "Loop Engineering",
193
+ "AI agents",
194
+ "Coding agents",
195
+ "Agent workflows"
196
+ ],
197
+ "author": {
198
+ "@type": "Person",
199
+ "name": "Chaoyue He"
200
+ }
201
+ }
202
+ </script>
203
+ </head>
204
+ <body>
205
+ <main>
206
+ <section class="hero">
207
+ <div>
208
+ <div class="eyebrow">Awesome Loop Engineering</div>
209
+ <h1>Design loops, not just prompts.</h1>
210
+ <p class="lead">
211
+ Loop Engineering is the AI and coding-agent practice of designing recurring systems that discover work, delegate it to agents, verify results, persist state, decide next actions, and run again.
212
+ </p>
213
+ <div class="actions">
214
+ <a class="button primary" href="https://github.com/ChaoYue0307/awesome-loop-engineering">Open GitHub Repo</a>
215
+ <a class="button" href="https://github.com/ChaoYue0307/awesome-loop-engineering/blob/main/DEFINITION.md">Read Definition</a>
216
+ <a class="button" href="https://github.com/ChaoYue0307/awesome-loop-engineering/blob/main/examples/README.md">See Examples</a>
217
+ </div>
218
+ </div>
219
+ <div class="visual">
220
+ <img src="https://raw.githubusercontent.com/ChaoYue0307/awesome-loop-engineering/main/assets/loop-engineering-stack.svg" alt="Loop Engineering stack diagram">
221
+ </div>
222
+ </section>
223
+
224
+ <section class="section">
225
+ <div class="definition">
226
+ <strong>Canonical definition:</strong>
227
+ Loop Engineering is the AI and coding-agent practice of designing recurring systems that discover work, delegate it to agents, verify results, persist state, decide next actions, and run again on a cadence, event, or until a verifiable goal is reached.
228
+ </div>
229
+ </section>
230
+
231
+ <section class="section wide-visual" aria-label="Loop Contract visual">
232
+ <img src="https://raw.githubusercontent.com/ChaoYue0307/awesome-loop-engineering/main/assets/loop-contract-cards.svg" alt="Loop Contract cards">
233
+ </section>
234
+
235
+ <section class="section wide-visual" aria-label="Loop Engineering lifecycle visual">
236
+ <img src="https://raw.githubusercontent.com/ChaoYue0307/awesome-loop-engineering/main/assets/loop-lifecycle.svg" alt="Loop Engineering lifecycle: Intake, Delegate, Act, Verify, Persist, Decide; Decide retries by feeding evidence back, escalates to a human, or exits when the goal is met">
237
+ </section>
238
+
239
+ <section class="section grid" aria-label="Engineering stack">
240
+ <div class="card">
241
+ <h2>The Stack</h2>
242
+ <div class="stack">
243
+ <div class="layer"><strong>Prompt Engineering</strong><br>What should I say to the model?</div>
244
+ <div class="layer"><strong>Context Engineering</strong><br>What state and knowledge should the model see?</div>
245
+ <div class="layer"><strong>Harness Engineering</strong><br>What tools, permissions, tests, and sandboxes surround one run?</div>
246
+ <div class="layer"><strong>Loop Engineering</strong><br>What recurring system governs agent work over time?</div>
247
+ </div>
248
+ </div>
249
+ <div class="card">
250
+ <h2>What The Repo Contains</h2>
251
+ <ul>
252
+ <li>Curated papers, blogs, docs, tools, benchmarks, and patterns.</li>
253
+ <li>Manifesto, taxonomy, comparison guide, and anti-patterns.</li>
254
+ <li>Validated loop contract schema and example loop specs.</li>
255
+ <li>Pattern library for PR, CI, docs, deploy, feedback, dependency, eval, security, cost, and bug-hunting loops.</li>
256
+ </ul>
257
+ </div>
258
+ <div class="card">
259
+ <h2>Contribute</h2>
260
+ <p>
261
+ Share resources, corrections, or real loop patterns with trigger, intake, delegation, verification, state, budget, escalation, and receipts.
262
+ </p>
263
+ <p><a href="https://github.com/ChaoYue0307/awesome-loop-engineering/issues/1">Join the community pattern thread</a></p>
264
+ </div>
265
+ </section>
266
+
267
+ <section class="section grid" aria-label="Key links">
268
+ <div class="card">
269
+ <h3>Start Here</h3>
270
+ <p>Use the README for the complete curated map and contribution path.</p>
271
+ <p><a href="https://github.com/ChaoYue0307/awesome-loop-engineering/blob/main/README.md">Read the README</a></p>
272
+ </div>
273
+ <div class="card">
274
+ <h3>Field Guides</h3>
275
+ <p>Understand the concept, boundaries, taxonomy, anti-patterns, and comparisons.</p>
276
+ <p><a href="https://github.com/ChaoYue0307/awesome-loop-engineering/blob/main/MANIFESTO.md">Read the Manifesto</a></p>
277
+ </div>
278
+ <div class="card">
279
+ <h3>Build A Loop</h3>
280
+ <p>Start from validated JSON specs or the pattern template.</p>
281
+ <p><a href="https://github.com/ChaoYue0307/awesome-loop-engineering/tree/main/examples">View examples</a></p>
282
+ </div>
283
+ </section>
284
+
285
+ <footer>
286
+ <p>
287
+ This is an early curated map of an emerging practice, not a final standard.
288
+ Original repository materials are released under CC0-1.0.
289
+ </p>
290
+ </footer>
291
+ </main>
292
+ </body>
293
+ </html>
docs/llms.txt ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Awesome Loop Engineering
2
+
3
+ > Curated resources and practical patterns for Loop Engineering: the practice of designing recurring AI-agent and coding-agent systems that discover work, delegate to agents, verify results, persist state, and run again on a cadence or until a verifiable goal is reached.
4
+
5
+ ## Core
6
+
7
+ - [README](https://github.com/ChaoYue0307/awesome-loop-engineering/blob/main/README.md): the curated list with the Loop Contract, design checklist, and maturity model
8
+ - [Canonical definition](https://github.com/ChaoYue0307/awesome-loop-engineering/blob/main/DEFINITION.md): short definition, positioning, and minimal loop test
9
+ - [Taxonomy](https://github.com/ChaoYue0307/awesome-loop-engineering/blob/main/TAXONOMY.md): classification by trigger, intake, verification, state model, and topology
10
+ - [Anti-patterns](https://github.com/ChaoYue0307/awesome-loop-engineering/blob/main/ANTI-PATTERNS.md): common loop failure modes
11
+
12
+ ## Patterns
13
+
14
+ - [Pattern library](https://github.com/ChaoYue0307/awesome-loop-engineering/blob/main/patterns/README.md): operational loop patterns with triggers, gates, budgets, and escalation
15
+ - [Loop contracts](https://github.com/ChaoYue0307/awesome-loop-engineering/blob/main/examples/README.md): schema-validated contract JSON for every pattern, plus runnable reference loops
16
+
17
+ ## Optional
18
+
19
+ - [Landing page](https://chaoyue0307.github.io/awesome-loop-engineering/)
20
+ - [Contributing](https://github.com/ChaoYue0307/awesome-loop-engineering/blob/main/CONTRIBUTING.md)
docs/robots.txt ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ User-agent: *
2
+ Allow: /
3
+
4
+ Sitemap: https://chaoyue0307.github.io/awesome-loop-engineering/sitemap.xml
docs/sitemap.xml ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
3
+ <url>
4
+ <loc>https://chaoyue0307.github.io/awesome-loop-engineering/</loc>
5
+ <changefreq>weekly</changefreq>
6
+ <priority>1.0</priority>
7
+ </url>
8
+ <url>
9
+ <loc>https://github.com/ChaoYue0307/awesome-loop-engineering</loc>
10
+ <changefreq>weekly</changefreq>
11
+ <priority>0.9</priority>
12
+ </url>
13
+ <url>
14
+ <loc>https://github.com/ChaoYue0307/awesome-loop-engineering/blob/main/DEFINITION.md</loc>
15
+ <changefreq>monthly</changefreq>
16
+ <priority>0.8</priority>
17
+ </url>
18
+ <url>
19
+ <loc>https://github.com/ChaoYue0307/awesome-loop-engineering/blob/main/MANIFESTO.md</loc>
20
+ <changefreq>monthly</changefreq>
21
+ <priority>0.8</priority>
22
+ </url>
23
+ <url>
24
+ <loc>https://github.com/ChaoYue0307/awesome-loop-engineering/blob/main/examples/README.md</loc>
25
+ <changefreq>monthly</changefreq>
26
+ <priority>0.7</priority>
27
+ </url>
28
+ </urlset>
examples/README.md ADDED
@@ -0,0 +1,90 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Loop Examples
2
+
3
+ These examples show how to turn the abstract loop contract into concrete operating specs.
4
+
5
+ ## Contract Library
6
+
7
+ Every loop in the [pattern library](../patterns/README.md) has a matching contract. Each JSON file follows [`schemas/loop-contract.schema.json`](../schemas/loop-contract.schema.json) and is validated in CI:
8
+
9
+ - [`pr-babysitter-loop.json`](pr-babysitter-loop.json)
10
+ - [`ci-repair-loop.json`](ci-repair-loop.json)
11
+ - [`docs-drift-loop.json`](docs-drift-loop.json)
12
+ - [`deploy-verifier-loop.json`](deploy-verifier-loop.json)
13
+ - [`feedback-clusterer-loop.json`](feedback-clusterer-loop.json)
14
+ - [`dependency-triage-loop.json`](dependency-triage-loop.json)
15
+ - [`evaluation-regression-loop.json`](evaluation-regression-loop.json)
16
+ - [`security-review-loop.json`](security-review-loop.json)
17
+ - [`cost-control-loop.json`](cost-control-loop.json)
18
+ - [`bug-hunting-loop.json`](bug-hunting-loop.json)
19
+ - [`enterprise-approval-loop.json`](enterprise-approval-loop.json)
20
+ - [`incident-response-loop.json`](incident-response-loop.json)
21
+ - [`data-quality-loop.json`](data-quality-loop.json)
22
+ - [`release-note-loop.json`](release-note-loop.json)
23
+ - [`model-routing-loop.json`](model-routing-loop.json)
24
+
25
+ Use them as starting points. Adapt triggers, tools, checks, state artifacts, and escalation rules to your repository and runtime.
26
+
27
+ ## Runnable Loops
28
+
29
+ The [runnable directory](runnable/README.md) contains working loop scripts, starting with a dependency-light test-repair loop you can drive with Claude Code, Codex CLI, or any agent CLI.
30
+
31
+ ## PR Babysitter
32
+
33
+ Use when a PR needs recurring attention but should not require a human to poll comments, checks, conflicts, and stale review state.
34
+
35
+ Example loop instruction:
36
+
37
+ ```text
38
+ Every 2 hours during working hours, inspect PR <number>.
39
+ Load review comments, check status, mergeability, linked issues, and project instructions.
40
+ If there is a narrow mechanical blocker, patch it in an isolated worktree and run the smallest relevant checks.
41
+ Record commands, changed files, check URLs, and remaining blockers in a PR comment.
42
+ Stop when the PR is merge-ready, waiting only on human review, blocked, or out of retry budget.
43
+ ```
44
+
45
+ Good gates:
46
+
47
+ - required checks pass;
48
+ - unresolved comments are answered or resolved;
49
+ - merge conflicts are gone;
50
+ - diff is limited to the stated blocker.
51
+
52
+ ## CI Repair Loop
53
+
54
+ Use when failing CI should be turned into either a small verified patch or an escalation note.
55
+
56
+ Example loop instruction:
57
+
58
+ ```text
59
+ When a required CI check fails, inspect the failing check, logs, artifacts, changed files, and recent successful run.
60
+ Identify the exact failing command or closest local equivalent.
61
+ Patch only the smallest log-backed cause, rerun the failing command first, and summarize evidence.
62
+ Escalate instead of changing tests, broad CI config, dependencies, or unrelated files without proof.
63
+ ```
64
+
65
+ Good gates:
66
+
67
+ - the original failing command passes locally or in rerun CI;
68
+ - the patch is limited to the failure cause;
69
+ - behavior changes include focused tests;
70
+ - the report includes the failing log excerpt and passing output.
71
+
72
+ ## Docs Drift Collector
73
+
74
+ Use when docs need periodic alignment with code, CLI behavior, schemas, or examples.
75
+
76
+ Example loop instruction:
77
+
78
+ ```text
79
+ Weekly, scan changed files, public docs, examples, generated API references, CLI help, and docs-related issues.
80
+ Confirm each possible drift item against code, schema, tests, or runtime output before editing.
81
+ Patch only verified mismatches, run docs/link/example checks, and record false positives so future runs do not repeat them.
82
+ Escalate when product behavior, generated docs, credentials, or screenshots need owner judgment.
83
+ ```
84
+
85
+ Good gates:
86
+
87
+ - examples run or match current output;
88
+ - link checker passes;
89
+ - generated files are not edited manually unless that is the project convention;
90
+ - false positives are recorded as loop state.
examples/bug-hunting-loop.json ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "Bug hunting",
3
+ "objective": "Find, validate, and report likely bugs with reproducible evidence instead of filing speculative agent-generated issues.",
4
+ "trigger": {
5
+ "type": "scheduled",
6
+ "cadence_or_event": "Weekly on modules with recent churn, and when error logs spike or flaky tests cluster."
7
+ },
8
+ "intake": {
9
+ "sources": ["error logs", "flaky tests", "issue labels", "support snippets", "recent diffs", "traces"],
10
+ "selection_rule": "Start only from concrete signals, search for duplicate issues first, and pursue candidates that reproduce in a safe environment."
11
+ },
12
+ "workspace": {
13
+ "isolation": "Branch, worktree, sandbox, or read-only mode depending on the target.",
14
+ "allowed_actions": ["run tests and local fixtures", "static search", "non-production reproduction", "file evidence-backed issues or small PRs"],
15
+ "disallowed_actions": ["production data access", "destructive fuzzing", "speculative mass issue creation", "broad refactors"]
16
+ },
17
+ "context": {
18
+ "required_files": ["module ownership docs", "safe reproduction commands"],
19
+ "runtime_sources": ["existing bug reports", "prior bug-hunt state and false positives"]
20
+ },
21
+ "agents": [
22
+ {
23
+ "role": "Scout",
24
+ "responsibility": "Discover suspicious signals and likely affected code paths."
25
+ },
26
+ {
27
+ "role": "Reproducer",
28
+ "responsibility": "Attempt minimal reproduction in a safe environment."
29
+ },
30
+ {
31
+ "role": "Minimizer",
32
+ "responsibility": "Reduce the reproduction to the smallest failing case."
33
+ },
34
+ {
35
+ "role": "Reporter",
36
+ "responsibility": "File evidence-backed issues, or a small PR with tests when the cause is clear."
37
+ }
38
+ ],
39
+ "verification": {
40
+ "gates": ["reports include reproducible steps or a clear trace link", "patches include a failing test or deterministic reproduction", "duplicate search is recorded", "expected vs actual behavior is grounded in docs or tests"],
41
+ "receipts": ["modules checked", "signals inspected", "reproduction commands", "expected and actual behavior", "final disposition"]
42
+ },
43
+ "state": {
44
+ "artifacts": ["bug-hunt log", "false-positive ledger"],
45
+ "update_rule": "Persist checked areas, reproductions, false positives, and dispositions so future runs do not repeat work."
46
+ },
47
+ "budget": {
48
+ "max_retries": 3,
49
+ "max_runtime_minutes": 90
50
+ },
51
+ "escalation": {
52
+ "conditions": ["production-only bug", "privacy-sensitive logs", "security-sensitive finding", "possible data loss", "fix needs architectural judgment"],
53
+ "destination": "Module owner via issue; private channel for security-sensitive findings"
54
+ },
55
+ "exit": {
56
+ "success": "A bug is reproduced and reported with evidence, or a small verified patch is opened.",
57
+ "stop_without_success": "The signal is classified as non-bug, retries are exhausted, or owner judgment is needed."
58
+ }
59
+ }
examples/ci-repair-loop.json ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "CI repair loop",
3
+ "objective": "Turn a failing CI signal into a small verified fix or a precise escalation note.",
4
+ "trigger": {
5
+ "type": "event",
6
+ "cadence_or_event": "A required CI check fails on an active pull request."
7
+ },
8
+ "intake": {
9
+ "sources": ["failed check name", "CI logs", "artifacts", "changed files", "recent successful run"],
10
+ "selection_rule": "Work only on failures with a reproducible command or a clear log-backed cause."
11
+ },
12
+ "workspace": {
13
+ "isolation": "Clean worktree based on the failing commit.",
14
+ "allowed_actions": ["inspect logs", "run test commands", "apply narrow fixes", "add focused tests"],
15
+ "disallowed_actions": ["weaken assertions", "delete tests", "broad formatting", "unrequested dependency upgrade"]
16
+ },
17
+ "context": {
18
+ "required_files": ["AGENTS.md", "README.md", "CONTRIBUTING.md"],
19
+ "runtime_sources": ["CI log URL", "failing command", "test artifacts"]
20
+ },
21
+ "agents": [
22
+ {
23
+ "role": "Investigator",
24
+ "responsibility": "Extract the failing command, error, and likely affected files."
25
+ },
26
+ {
27
+ "role": "Implementer",
28
+ "responsibility": "Make the smallest patch consistent with the failure evidence."
29
+ },
30
+ {
31
+ "role": "Verifier",
32
+ "responsibility": "Rerun the failing command and adjacent cheap checks."
33
+ },
34
+ {
35
+ "role": "Reporter",
36
+ "responsibility": "Summarize evidence and residual risk."
37
+ }
38
+ ],
39
+ "verification": {
40
+ "gates": ["original failing command passes", "patch is limited to the failure cause", "new behavior has a focused test when needed"],
41
+ "receipts": ["failing log excerpt", "commands run", "passing output", "diff summary"]
42
+ },
43
+ "state": {
44
+ "artifacts": ["CI repair progress note", "PR comment"],
45
+ "update_rule": "Record failed command, root-cause hypothesis, patch attempts, verification output, and unresolved blockers."
46
+ },
47
+ "budget": {
48
+ "max_retries": 3,
49
+ "max_runtime_minutes": 90
50
+ },
51
+ "escalation": {
52
+ "conditions": ["missing credentials", "third-party outage", "nondeterministic failure", "fix exceeds scope"],
53
+ "destination": "PR comment or issue assigned to the owning team"
54
+ },
55
+ "exit": {
56
+ "success": "The target check passes locally or in rerun CI.",
57
+ "stop_without_success": "Failure is flaky, not reproducible, blocked by environment, or requires owner approval."
58
+ }
59
+ }
examples/cost-control-loop.json ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "Cost control",
3
+ "objective": "Keep long-running agent workflows within budget by measuring usage, identifying waste, and proposing scoped efficiency improvements.",
4
+ "trigger": {
5
+ "type": "scheduled",
6
+ "cadence_or_event": "Daily or weekly usage review, and when spend, tokens, retries, or runtime exceed thresholds for a workflow."
7
+ },
8
+ "intake": {
9
+ "sources": ["token and model usage", "tool-call counts", "retry volume", "trace IDs", "billing exports", "recent workflow changes"],
10
+ "selection_rule": "Cluster usage by workflow, task type, model, and retry cause; investigate only clusters that exceed budget policy or baseline."
11
+ },
12
+ "workspace": {
13
+ "isolation": "Read-only access to traces, billing exports, dashboards, and workflow configs.",
14
+ "allowed_actions": ["analyze usage", "inspect traces", "propose config or prompt changes", "verify against representative tasks"],
15
+ "disallowed_actions": ["silent quality-reducing changes", "disabling verification gates", "production routing changes"]
16
+ },
17
+ "context": {
18
+ "required_files": ["budget policy", "accepted cost exceptions"],
19
+ "runtime_sources": ["baseline spend window", "trace samples", "recent prompt and harness changes"]
20
+ },
21
+ "agents": [
22
+ {
23
+ "role": "Analyst",
24
+ "responsibility": "Cluster usage by workflow, task type, model, tool, and retry cause."
25
+ },
26
+ {
27
+ "role": "Investigator",
28
+ "responsibility": "Inspect traces for context bloat, repeated failures, and missing stop conditions."
29
+ },
30
+ {
31
+ "role": "Optimizer",
32
+ "responsibility": "Propose the smallest change: smaller context, cheaper routing, caching, batching, or early exit."
33
+ },
34
+ {
35
+ "role": "Verifier",
36
+ "responsibility": "Rerun sample tasks or evals to confirm quality is preserved."
37
+ }
38
+ ],
39
+ "verification": {
40
+ "gates": ["before/after usage measured on a comparable task mix", "quality gates and evals still pass", "savings estimates include uncertainty and sample size", "verification and escalation remain intact"],
41
+ "receipts": ["baseline spend", "usage clusters", "trace samples", "before/after metrics", "verification results"]
42
+ },
43
+ "state": {
44
+ "artifacts": ["cost review report", "accepted-exception ledger"],
45
+ "update_rule": "Record baseline, suspected causes, proposed changes, and verification evidence after each review."
46
+ },
47
+ "budget": {
48
+ "max_retries": 2,
49
+ "max_runtime_minutes": 60
50
+ },
51
+ "escalation": {
52
+ "conditions": ["quality tradeoff required", "model-routing policy change", "customer impact", "unknown spend source"],
53
+ "destination": "Workflow owner with before/after evidence and rollout plan"
54
+ },
55
+ "exit": {
56
+ "success": "Spend returns below threshold, or a verified scoped optimization is proposed with evidence.",
57
+ "stop_without_success": "The cause is explained but the fix requires owner approval, or retries are exhausted."
58
+ }
59
+ }
examples/data-quality-loop.json ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "Data quality",
3
+ "objective": "Keep a recurring dataset or knowledge base trustworthy by validating each refresh against explicit quality rules before it is published.",
4
+ "trigger": {
5
+ "type": "event",
6
+ "cadence_or_event": "After each dataset or knowledge-base refresh, or nightly; also when the source schema changes or a freshness SLA is breached."
7
+ },
8
+ "intake": {
9
+ "sources": ["new dataset version", "schema and row counts", "prior accepted version", "quality rule definitions"],
10
+ "selection_rule": "Validate the latest version against the data contract and quality rules; quarantine on any hard-rule failure."
11
+ },
12
+ "workspace": {
13
+ "isolation": "Read access to the dataset, schema, profiling tools, and prior versions; quarantine area separate from production.",
14
+ "allowed_actions": ["run validation queries", "profile the data", "write a quality report", "quarantine a failing version"],
15
+ "disallowed_actions": ["edit source data", "publish to production", "relax rules without review"]
16
+ },
17
+ "context": {
18
+ "required_files": ["data contract or schema", "quality-rule definitions", "ownership map"],
19
+ "runtime_sources": ["load metrics", "profiling output", "diff against the last accepted version"]
20
+ },
21
+ "agents": [
22
+ {
23
+ "role": "Profiler",
24
+ "responsibility": "Compute counts, distributions, null rates, and freshness for the new version."
25
+ },
26
+ {
27
+ "role": "Validator",
28
+ "responsibility": "Check the profile against quality rules and the prior accepted baseline."
29
+ },
30
+ {
31
+ "role": "Investigator",
32
+ "responsibility": "Classify each failure as a defect, an accepted shift, or a rule bug."
33
+ },
34
+ {
35
+ "role": "Reporter",
36
+ "responsibility": "Record results, quarantine bad versions, and propose rule fixes."
37
+ }
38
+ ],
39
+ "verification": {
40
+ "gates": ["hard rules pass before a version is promotable", "distribution shifts beyond threshold are flagged with the delta", "every quarantine cites the failing rule and a sample", "accepted exceptions are recorded"],
41
+ "receipts": ["dataset version", "profile metrics", "rule results", "quarantine status with samples"]
42
+ },
43
+ "state": {
44
+ "artifacts": ["quality report", "accepted-exception ledger"],
45
+ "update_rule": "Persist the profile, rule results, and any new accepted exception so recurring shifts are not re-investigated."
46
+ },
47
+ "budget": {
48
+ "max_retries": 2,
49
+ "max_runtime_minutes": 90
50
+ },
51
+ "escalation": {
52
+ "conditions": ["ambiguous distribution shift", "schema change needing a data-contract update", "repeated upstream failure", "regulated or PII-bearing fields", "a rule that may itself be wrong"],
53
+ "destination": "Dataset owner via the data-quality channel"
54
+ },
55
+ "exit": {
56
+ "success": "The version is validated against all hard rules and ready for promotion.",
57
+ "stop_without_success": "The version is quarantined with evidence, or a shift needs owner judgment."
58
+ }
59
+ }
examples/dependency-triage-loop.json ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "Dependency triage",
3
+ "objective": "Classify dependency updates into safe patches, deferred upgrades, or human-review items with reproducible evidence.",
4
+ "trigger": {
5
+ "type": "scheduled",
6
+ "cadence_or_event": "Weekly, and on Dependabot, Renovate, or advisory-driven update PRs."
7
+ },
8
+ "intake": {
9
+ "sources": ["dependency update PRs", "release notes and changelogs", "security advisories", "lockfile diffs", "package audit output"],
10
+ "selection_rule": "Group updates by risk: safe patch, minor feature, major migration, security, or blocked; act automatically only on the safe group."
11
+ },
12
+ "workspace": {
13
+ "isolation": "Clean branch or worktree per update group.",
14
+ "allowed_actions": ["run package manager commands", "run tests, typechecks, and builds", "apply low-risk updates", "comment on PRs"],
15
+ "disallowed_actions": ["major version migrations", "runtime version changes", "security-policy changes", "broad multi-group upgrades"]
16
+ },
17
+ "context": {
18
+ "required_files": ["compatibility policy", "supported runtime versions"],
19
+ "runtime_sources": ["recent CI status", "known flaky tests", "prior triage state"]
20
+ },
21
+ "agents": [
22
+ {
23
+ "role": "Classifier",
24
+ "responsibility": "Group updates by risk, security relevance, version change, and blast radius."
25
+ },
26
+ {
27
+ "role": "Implementer",
28
+ "responsibility": "Apply low-risk updates and resolve lockfile conflicts."
29
+ },
30
+ {
31
+ "role": "Verifier",
32
+ "responsibility": "Run targeted tests, typechecks, builds, and package audits."
33
+ },
34
+ {
35
+ "role": "Reporter",
36
+ "responsibility": "Record accepted, deferred, and human-review updates with reasons."
37
+ }
38
+ ],
39
+ "verification": {
40
+ "gates": ["lockfile and manifest are consistent", "relevant tests, typecheck, build, and audit pass", "no skipped migration steps named in changelogs", "diff is limited to the intended group"],
41
+ "receipts": ["package versions and changelog links", "commands run with output", "deferred reasons", "reviewer questions"]
42
+ },
43
+ "state": {
44
+ "artifacts": ["triage report comment", "processed-update ledger"],
45
+ "update_rule": "Record processed update IDs, verification evidence, and deferral reasons after each group."
46
+ },
47
+ "budget": {
48
+ "max_retries": 2,
49
+ "max_runtime_minutes": 60
50
+ },
51
+ "escalation": {
52
+ "conditions": ["major version upgrade", "runtime requirement change", "security advisory with product impact", "licensing concern", "repeated verification failure"],
53
+ "destination": "Issue assigned to the repository owner with the blocked group and evidence"
54
+ },
55
+ "exit": {
56
+ "success": "Safe updates are verified and merged or review-ready, and risky updates are deferred with reasons.",
57
+ "stop_without_success": "Verification fails repeatedly or remaining updates all require human review."
58
+ }
59
+ }