KrisSimon commited on
Commit
423dc73
·
verified ·
1 Parent(s): 414381b

Upload ARO Coder 4-bit (distill_student)

Browse files
Files changed (2) hide show
  1. model.safetensors +1 -1
  2. promotion_gate.json +90 -90
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5226aee5f953c9315db787c0e49cbeaf13da669f54b79bcd204ea90d9fc2f70b
3
  size 4607835164
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:453768b2f59b7887a520eaf3c7552377059927bb0b98c7aab78fcb85f205b4ae
3
  size 4607835164
promotion_gate.json CHANGED
@@ -1,17 +1,17 @@
1
  {
2
  "reply_rate": 1.0,
3
  "empty_think_rate": 0.0,
4
- "syntax_pass_rate": 0.5806451612903226,
5
  "tool_leak_rate": 0.0,
6
  "url_contam_rate": 0.0,
7
  "total": 100,
8
- "with_code": 93,
9
  "results": [
10
  {
11
  "idx": 1,
12
  "cat": "repl_oneliner",
13
  "prompt": "Write a single ARO line that logs the message 'Hello, World!' to the console.",
14
- "reply": "```aro\nLog \"Hello, World!\" to the <console>.\n```",
15
  "empty_think": false,
16
  "has_code": true,
17
  "tool_leak": false,
@@ -21,7 +21,7 @@
21
  "idx": 2,
22
  "cat": "repl_oneliner",
23
  "prompt": "Write one ARO statement that retrieves the current time from the clock.",
24
- "reply": "```aro\nRetrieve the <current-time> from the <clock>.\n```",
25
  "empty_think": false,
26
  "has_code": true,
27
  "tool_leak": false,
@@ -31,7 +31,7 @@
31
  "idx": 3,
32
  "cat": "repl_oneliner",
33
  "prompt": "Write a single line that computes the length of the string 'banana'.",
34
- "reply": "Compute the <length: length> from the <string: \"banana\">.",
35
  "empty_think": false,
36
  "has_code": false,
37
  "tool_leak": false,
@@ -41,7 +41,7 @@
41
  "idx": 4,
42
  "cat": "repl_oneliner",
43
  "prompt": "Write one ARO statement that converts the string 'hello' to uppercase.",
44
- "reply": "```aro\nTransform the <upper: uppercase> from the <string: \"hello\">.\n```",
45
  "empty_think": false,
46
  "has_code": true,
47
  "tool_leak": false,
@@ -51,7 +51,7 @@
51
  "idx": 5,
52
  "cat": "repl_oneliner",
53
  "prompt": "Write one line that hashes the password 'secret'.",
54
- "reply": "Use the `Hash` action: `Hash the <password> from \"secret\".`",
55
  "empty_think": false,
56
  "has_code": false,
57
  "tool_leak": false,
@@ -71,7 +71,7 @@
71
  "idx": 7,
72
  "cat": "repl_oneliner",
73
  "prompt": "Write one line that retrieves the git status.",
74
- "reply": "Read the <status> from the <git: status>.",
75
  "empty_think": false,
76
  "has_code": false,
77
  "tool_leak": false,
@@ -91,7 +91,7 @@
91
  "idx": 9,
92
  "cat": "repl_oneliner",
93
  "prompt": "Write one ARO statement that reads the file 'config.yaml' from the filesystem.",
94
- "reply": "```aro\nRead the <config> from the <file: \"config.yaml\">.\n```",
95
  "empty_think": false,
96
  "has_code": true,
97
  "tool_leak": false,
@@ -111,7 +111,7 @@
111
  "idx": 11,
112
  "cat": "repl_block",
113
  "prompt": "Write a 3-statement ARO snippet that reads a file, uppercases it, and logs the result.",
114
- "reply": "```aro\nRead the <content> from the <file: \"input.txt\">.\nCompute the <upper: uppercase> from the <content>.\nLog <upper> to the <console>.\n```",
115
  "empty_think": false,
116
  "has_code": true,
117
  "tool_leak": false,
@@ -121,7 +121,7 @@
121
  "idx": 12,
122
  "cat": "repl_block",
123
  "prompt": "Write a 4-statement snippet that fetches users from a repository, computes the count, and logs it.",
124
- "reply": "```aro\nRetrieve the <users> from the <user-repository>.\nCompute the <count> from the <users: length>.\nLog the <count> to the <console>.\nReturn an <OK: status> for the <result>.\n```",
125
  "empty_think": false,
126
  "has_code": true,
127
  "tool_leak": false,
@@ -131,7 +131,7 @@
131
  "idx": 13,
132
  "cat": "repl_block",
133
  "prompt": "Write an ARO snippet that stages all changes, commits with message 'wip', and pushes.",
134
- "reply": "```aro\n(StageAndPush: Git Workflow) {\n Stage the <changes> to the <git>.\n Commit the <changes> to the <git> with \"wip\".\n Push the <changes> to the <git> with \"wip\".\n Return an <OK: status> for the <push>.\n}\n```",
135
  "empty_think": false,
136
  "has_code": true,
137
  "tool_leak": false,
@@ -141,7 +141,7 @@
141
  "idx": 14,
142
  "cat": "repl_block",
143
  "prompt": "Write a 3-statement snippet that creates a list, computes its length, and logs the length.",
144
- "reply": "```aro\nExtract the <items> from the <input>.\nCompute the <length> from the <items>.\nLog the <length> to the <console>.\n```",
145
  "empty_think": false,
146
  "has_code": true,
147
  "tool_leak": false,
@@ -151,7 +151,7 @@
151
  "idx": 15,
152
  "cat": "repl_block",
153
  "prompt": "Write a snippet that extracts a name from an event, uppercases it, and stores it back in a variable.",
154
- "reply": "```aro\nExtract the <name> from the <event: name>.\nCompute the <upper: uppercase> from the <name>.\nStore the <upper> into the <variable>.\n```",
155
  "empty_think": false,
156
  "has_code": true,
157
  "tool_leak": false,
@@ -161,7 +161,7 @@
161
  "idx": 16,
162
  "cat": "repl_block",
163
  "prompt": "Write a 3-statement snippet that computes 3 + 4, multiplies by 2, and logs the result.",
164
- "reply": "```aro\nCompute the <sum> from <a> + <b>.\nCompute the <doubled> from <sum> * 2.\nLog <doubled> to the <console>.\n```",
165
  "empty_think": false,
166
  "has_code": true,
167
  "tool_leak": false,
@@ -171,7 +171,7 @@
171
  "idx": 17,
172
  "cat": "repl_block",
173
  "prompt": "Write a snippet that reads two numbers and returns their sum.",
174
- "reply": "```aro\n(AddTwoNumbers: Example) {\n Extract the <a> from the <input: a>.\n Extract the <b> from the <input: b>.\n Compute the <sum> from <a> + <b>.\n Return an <OK: status> with <sum>.\n}\n```",
175
  "empty_think": false,
176
  "has_code": true,
177
  "tool_leak": false,
@@ -181,7 +181,7 @@
181
  "idx": 18,
182
  "cat": "repl_block",
183
  "prompt": "Write a snippet that filters a list of users where age > 18 and counts them.",
184
- "reply": "```aro\n(FilterAdults: User API) {\n Extract the <users> from the <request: body>.\n Filter the <adults> from the <users> where <age> > 18.\n Count the <count> from the <adults>.\n Return an <OK: status> with { count: <count> }.\n}\n```",
185
  "empty_think": false,
186
  "has_code": true,
187
  "tool_leak": false,
@@ -191,7 +191,7 @@
191
  "idx": 19,
192
  "cat": "repl_block",
193
  "prompt": "Write a snippet that joins two lists and stores the result as <combined>.",
194
- "reply": "```aro\nJoin the <list-a> with the <list-b> into the <combined>.\n```",
195
  "empty_think": false,
196
  "has_code": true,
197
  "tool_leak": false,
@@ -201,7 +201,7 @@
201
  "idx": 20,
202
  "cat": "repl_block",
203
  "prompt": "Write a snippet that parses a JSON string and extracts the 'name' field.",
204
- "reply": "```aro\n(ExtractName: JSON Parser) {\n Extract the <json> from the <input: json>.\n Parse the <parsed> from the <json>.\n Extract the <name> from the <parsed: name>.\n Return an <OK: status> with <name>.\n}\n```",
205
  "empty_think": false,
206
  "has_code": true,
207
  "tool_leak": false,
@@ -221,7 +221,7 @@
221
  "idx": 22,
222
  "cat": "user_action",
223
  "prompt": "Write a user-defined action 'Greet' that takes a name and returns a greeting string.",
224
- "reply": "```aro\n(Greet: Greeting) {\n Extract the <name> from the <input: name>.\n Compute the <greeting> from \"Hello, \" ++ <name>.\n Return an <OK: status> with <greeting>.\n}\n```",
225
  "empty_think": false,
226
  "has_code": true,
227
  "tool_leak": false,
@@ -231,7 +231,7 @@
231
  "idx": 23,
232
  "cat": "user_action",
233
  "prompt": "Write a user-defined action 'AddTwoNumbers' that takes two numbers and returns their sum.",
234
- "reply": "```aro\n(AddTwoNumbers: Math) {\n Extract the <a> from the <input: a>.\n Extract the <b> from the <input: b>.\n Compute the <sum> from <a> + <b>.\n Return an <OK: status> with <sum>.\n}\n```",
235
  "empty_think": false,
236
  "has_code": true,
237
  "tool_leak": false,
@@ -241,7 +241,7 @@
241
  "idx": 24,
242
  "cat": "user_action",
243
  "prompt": "Write a user-defined action 'ValidateEmail' that takes an email string and returns OK or Error.",
244
- "reply": "```aro\n(ValidateEmail: Email Validation) {\n Extract the <email> from the <input: email>.\n Validate the <email> against the <email-pattern>.\n Return an <OK: status> for the <valid: email>.\n}\n```",
245
  "empty_think": false,
246
  "has_code": true,
247
  "tool_leak": false,
@@ -251,7 +251,7 @@
251
  "idx": 25,
252
  "cat": "user_action",
253
  "prompt": "Write a user-defined action 'Square' that takes a number and returns its square.",
254
- "reply": "```aro\n(Square: Action) {\n Extract the <n> from the <input: number>.\n Compute the <square> from <n> * <n>.\n Return an <OK: status> with { square: <square> }.\n}\n```",
255
  "empty_think": false,
256
  "has_code": true,
257
  "tool_leak": false,
@@ -261,7 +261,7 @@
261
  "idx": 26,
262
  "cat": "user_action",
263
  "prompt": "Write a user-defined action 'FormatDate' that takes a date and a format string.",
264
- "reply": "```aro\n(FormatDate: Date Formatter) {\n Extract the <date> from the <input: date>.\n Extract the <format> from the <input: format>.\n Format the <formatted> from the <date> with <format>.\n Return an <OK: status> with <formatted>.\n}\n```",
265
  "empty_think": false,
266
  "has_code": true,
267
  "tool_leak": false,
@@ -271,7 +271,7 @@
271
  "idx": 27,
272
  "cat": "user_action",
273
  "prompt": "Write a user-defined action 'CountWords' that takes a string and returns the word count.",
274
- "reply": "```aro\n(CountWords: String Processor) {\n Extract the <text> from the <input: text>.\n Split the <words> from the <text> by whitespace.\n Count the <word-count> from the <words>.\n Return an <OK: status> with { count: <word-count> }.\n}\n```",
275
  "empty_think": false,
276
  "has_code": true,
277
  "tool_leak": false,
@@ -281,7 +281,7 @@
281
  "idx": 28,
282
  "cat": "user_action",
283
  "prompt": "Write a user-defined action 'PickRandom' that takes a list and returns a random element.",
284
- "reply": "```aro\n(PickRandom: Action) {\n Extract the <list> from the <input>.\n Compute the <random-element> from the <list: collections.pick-random>.\n Return an <OK: status> with <random-element>.\n}\n```",
285
  "empty_think": false,
286
  "has_code": true,
287
  "tool_leak": false,
@@ -291,7 +291,7 @@
291
  "idx": 29,
292
  "cat": "user_action",
293
  "prompt": "Write a user-defined action 'Capitalize' that takes a string and uppercases its first letter.",
294
- "reply": "```aro\n(Capitalize: String Transformer) {\n Extract the <input> from the <input: string>.\n Compute the <capitalized> from <input> with <capitalize>.\n Return an <OK: status> with <capitalized>.\n}\n```",
295
  "empty_think": false,
296
  "has_code": true,
297
  "tool_leak": false,
@@ -321,7 +321,7 @@
321
  "idx": 32,
322
  "cat": "event_handler",
323
  "prompt": "Write an event handler for OrderPlaced that decrements inventory.",
324
- "reply": "```aro\n(OrderPlaced: OrderPlaced Handler) {\n Extract the <order> from the <event: order>.\n Extract the <item> from the <order: item>.\n Extract the <quantity> from the <order: quantity>.\n Decrement the <inventory> for the <item> by <quantity>.\n Return an <OK: status> for the <inventory-update>.\n}\n```",
325
  "empty_think": false,
326
  "has_code": true,
327
  "tool_leak": false,
@@ -331,7 +331,7 @@
331
  "idx": 33,
332
  "cat": "event_handler",
333
  "prompt": "Write an event handler for PaymentFailed that logs the error and notifies the user.",
334
- "reply": "```aro\n(PaymentFailed Handler: Payment API) {\n Extract the <error> from the <event: error>.\n Log <error> to the <console>.\n Notify the <user> with <error>.\n Return an <OK: status> for the <handler>.\n}\n```",
335
  "empty_think": false,
336
  "has_code": true,
337
  "tool_leak": false,
@@ -341,7 +341,7 @@
341
  "idx": 34,
342
  "cat": "event_handler",
343
  "prompt": "Write an event handler for FileChanged that re-reads the configuration.",
344
- "reply": "```aro\n(File Changed: Config Reload) {\n Extract the <file> from the <event: file>.\n Read the <config> from the <file>.\n Store the <config> into the <config-cache>.\n Return an <OK: status> for the <reload>.\n}\n```",
345
  "empty_think": false,
346
  "has_code": true,
347
  "tool_leak": false,
@@ -351,7 +351,7 @@
351
  "idx": 35,
352
  "cat": "event_handler",
353
  "prompt": "Write an event handler for LoginAttempt that records the IP address.",
354
- "reply": "```aro\n(Send Login Attempt: LoginAttempt Handler) {\n Extract the <ip> from the <event: ip>.\n Log <ip> to the <console>.\n Return an <OK: status> for the <attempt>.\n}\n```",
355
  "empty_think": false,
356
  "has_code": true,
357
  "tool_leak": false,
@@ -361,7 +361,7 @@
361
  "idx": 36,
362
  "cat": "event_handler",
363
  "prompt": "Write an event handler for GitPush that triggers a CI build.",
364
- "reply": "```aro\n(GitPush: Git Event Handler) {\n Extract the <branch> from the <event: branch>.\n Extract the <commit> from the <event: commit>.\n Extract the <repository> from the <event: repository>.\n Trigger the <ci-build> with { branch: <branch>, commit: <commit>, repository: <repository> }.\n Return an <OK: status> for the <build-triggered>.\n}\n```",
365
  "empty_think": false,
366
  "has_code": true,
367
  "tool_leak": false,
@@ -371,7 +371,7 @@
371
  "idx": 37,
372
  "cat": "event_handler",
373
  "prompt": "Write an event handler for SubscriptionExpired that downgrades the account.",
374
- "reply": "```aro\n(DowngradeAccount: SubscriptionExpired Handler) {\n Extract the <account> from the <event: account>.\n Extract the <plan> from the <account: plan>.\n Downgrade the <account> to the <plan: basic>.\n Return an <OK: status> for the <downgrade>.\n}\n```",
375
  "empty_think": false,
376
  "has_code": true,
377
  "tool_leak": false,
@@ -381,7 +381,7 @@
381
  "idx": 38,
382
  "cat": "event_handler",
383
  "prompt": "Write an event handler for ServerStarted that warms up the cache.",
384
- "reply": "```aro\n(ServerStarted: Cache Warmup) {\n Extract the <server> from the <event: server>.\n Warm the <cache> for the <server>.\n Return an <OK: status> for the <warmup>.\n}\n```",
385
  "empty_think": false,
386
  "has_code": true,
387
  "tool_leak": false,
@@ -391,7 +391,7 @@
391
  "idx": 39,
392
  "cat": "event_handler",
393
  "prompt": "Write an event handler for MessageReceived that echoes the message back.",
394
- "reply": "```aro\n(MessageEcho: MessageReceived Handler) {\n Extract the <message> from the <event: message>.\n Log <message> to the <console>.\n Return an <OK: status> for the <echo>.\n}\n```",
395
  "empty_think": false,
396
  "has_code": true,
397
  "tool_leak": false,
@@ -401,7 +401,7 @@
401
  "idx": 40,
402
  "cat": "event_handler",
403
  "prompt": "Write an event handler for ImageUploaded that generates a thumbnail.",
404
- "reply": "```aro\n(ImageUploaded: Event Handler) {\n Extract the <image> from the <event: image>.\n Create the <thumbnail> from the <image>.\n Store the <thumbnail> into the <thumbnail-repository>.\n Return an <OK: status> for the <thumbnail-generation>.\n}\n```",
405
  "empty_think": false,
406
  "has_code": true,
407
  "tool_leak": false,
@@ -411,7 +411,7 @@
411
  "idx": 41,
412
  "cat": "application",
413
  "prompt": "Write a complete ARO Application-Start that prints Hello and exits.",
414
- "reply": "```aro\n(Application-Start: Example) {\n Log \"Hello\" to the <console>.\n Return an <OK: status> for the <startup>.\n}\n```",
415
  "empty_think": false,
416
  "has_code": true,
417
  "tool_leak": false,
@@ -421,7 +421,7 @@
421
  "idx": 42,
422
  "cat": "application",
423
  "prompt": "Write a complete Application-Start that starts an HTTP server on port 8080.",
424
- "reply": "```aro\n(Application-Start: HTTP Server) {\n Start the <http-server> with <port: 8080>.\n Return an <OK: status> for the <startup>.\n}\n```",
425
  "empty_think": false,
426
  "has_code": true,
427
  "tool_leak": false,
@@ -431,7 +431,7 @@
431
  "idx": 43,
432
  "cat": "application",
433
  "prompt": "Write a complete Application-Start that watches a directory for changes.",
434
- "reply": "```aro\n(Application-Start: Watcher) {\n Log \"Starting watcher...\" to the <console>.\n Start the <file-monitor> with { path: \"./watched\" }.\n Keepalive the <application> for the <events>.\n Return an <OK: status> for the <startup>.\n}\n```",
435
  "empty_think": false,
436
  "has_code": true,
437
  "tool_leak": false,
@@ -451,7 +451,7 @@
451
  "idx": 45,
452
  "cat": "application",
453
  "prompt": "Write a complete Application-Start that opens a TCP echo server on port 9000.",
454
- "reply": "```aro\n(Application-Start: Echo Server) {\n Start the <tcp-server> with { port: 9000, echo: true }.\n Log \"Echo server started on port 9000\" to the <console>.\n Return an <OK: status> for the <startup>.\n}\n```",
455
  "empty_think": false,
456
  "has_code": true,
457
  "tool_leak": false,
@@ -461,7 +461,7 @@
461
  "idx": 46,
462
  "cat": "application",
463
  "prompt": "Write a complete Application-Start that starts a WebSocket server and keeps it alive.",
464
- "reply": "```aro\n(Application-Start: WebSocket App) {\n Start the <websocket-server> with <websocket-config>.\n Keepalive the <application> for the <websocket-events>.\n Return an <OK: status> for the <startup>.\n}\n```",
465
  "empty_think": false,
466
  "has_code": true,
467
  "tool_leak": false,
@@ -471,7 +471,7 @@
471
  "idx": 47,
472
  "cat": "application",
473
  "prompt": "Write a complete Application-Start that connects to a database and runs a single query.",
474
- "reply": "```aro\n(Application-Start: Database App) {\n Connect the <connection> to the <database: \"localhost\">.\n Query the <result> from the <connection: \"SELECT * FROM users\">.\n Return an <OK: status> for the <startup>.\n}\n```",
475
  "empty_think": false,
476
  "has_code": true,
477
  "tool_leak": false,
@@ -481,7 +481,7 @@
481
  "idx": 48,
482
  "cat": "application",
483
  "prompt": "Write a complete Application-Start that reads command-line parameters and prints them.",
484
- "reply": "```aro\n(Application-Start: My App) {\n Extract the <args> from the <command-line: arguments>.\n Log \"Arguments: \" to the <console>.\n Log <args> to the <console>.\n Return an <OK: status> for the <startup>.\n}\n```",
485
  "empty_think": false,
486
  "has_code": true,
487
  "tool_leak": false,
@@ -491,7 +491,7 @@
491
  "idx": 49,
492
  "cat": "application",
493
  "prompt": "Write a complete Application-Start that loads a configuration file and logs it.",
494
- "reply": "```aro\n(Application-Start: My App) {\n Read the <config> from the <file: \"config.json\">.\n Log the <config> to the <console>.\n Return an <OK: status> for the <startup>.\n}\n```",
495
  "empty_think": false,
496
  "has_code": true,
497
  "tool_leak": false,
@@ -501,7 +501,7 @@
501
  "idx": 50,
502
  "cat": "application",
503
  "prompt": "Write a complete Application-Start that prints the current git branch.",
504
- "reply": "```aro\n(Application-Start: My App) {\n Log \"Starting...\" to the <console>.\n Start the <http-server> with <contract>.\n Return an <OK: status> for the <startup>.\n}\n```",
505
  "empty_think": false,
506
  "has_code": true,
507
  "tool_leak": false,
@@ -521,7 +521,7 @@
521
  "idx": 52,
522
  "cat": "http_api",
523
  "prompt": "Write the openapi.yaml plus feature set for a POST /products endpoint.",
524
- "reply": "**openapi.yaml**\n```yaml\nopenapi: 3.0.3\ninfo:\n title: Product API\n description: A simple API for managing products\n version: 1.0.0\nservers:\n - url: http://localhost:8080\npaths:\n /products:\n post:\n operationId: createProduct\n summary: Create a new product\n requestBody:\n required: true\n content:\n application/json:\n schema:\n $ref: '#/components/schemas/Product'\n responses:\n '201':\n description: Created\n ",
525
  "empty_think": false,
526
  "has_code": true,
527
  "tool_leak": false,
@@ -541,7 +541,7 @@
541
  "idx": 54,
542
  "cat": "http_api",
543
  "prompt": "Write a feature set for createOrder that validates the request body and emits OrderCreated.",
544
- "reply": "```aro\n(createOrder: Order API) {\n Extract the <request-body> from the <request: body>.\n Validate the <request-body> for the <order-schema>.\n Emit an <OrderCreated: event> with <request-body>.\n Return an <OK: status> for the <order-creation>.\n}\n```",
545
  "empty_think": false,
546
  "has_code": true,
547
  "tool_leak": false,
@@ -551,7 +551,7 @@
551
  "idx": 55,
552
  "cat": "http_api",
553
  "prompt": "Write a feature set for deleteSession that removes a session from the sessions-repository.",
554
- "reply": "```aro\n(deleteSession: Session API) {\n Extract the <session-id> from the <request: body>.\n Delete the <session> from the <sessions-repository> where <id> = <session-id>.\n Return an <OK: status> for the <deletion>.\n}\n```",
555
  "empty_think": false,
556
  "has_code": true,
557
  "tool_leak": false,
@@ -561,7 +561,7 @@
561
  "idx": 56,
562
  "cat": "http_api",
563
  "prompt": "Write a feature set for searchProducts that takes a query parameter and filters results.",
564
- "reply": "```aro\n(SearchProducts: Product API) {\n Extract the <query> from the <request: query>.\n Retrieve the <products> from the <product-repository>.\n Filter the <filtered-products> from the <products> where <name> contains <query>.\n Return an <OK: status> with <filtered-products>.\n}\n```",
565
  "empty_think": false,
566
  "has_code": true,
567
  "tool_leak": false,
@@ -571,7 +571,7 @@
571
  "idx": 57,
572
  "cat": "http_api",
573
  "prompt": "Write a feature set for updateProfile that patches a user record.",
574
- "reply": "```aro\n(UpdateProfile: User API) {\n Extract the <userId> from the <pathParameters: id>.\n Extract the <updates> from the <request: body>.\n Retrieve the <user> from the <user-repository> where id = <userId>.\n Patch the <user> with <updates>.\n Store the <updated-user> into the <user-repository>.\n Return an <OK: status> with <updated-user>.\n}\n```",
575
  "empty_think": false,
576
  "has_code": true,
577
  "tool_leak": false,
@@ -581,7 +581,7 @@
581
  "idx": 58,
582
  "cat": "http_api",
583
  "prompt": "Write a feature set for healthCheck that returns OK.",
584
- "reply": "```aro\n(HealthCheck: Health API) {\n Return an <OK: status> for the <health-check>.\n}\n```",
585
  "empty_think": false,
586
  "has_code": true,
587
  "tool_leak": false,
@@ -611,7 +611,7 @@
611
  "idx": 61,
612
  "cat": "repository",
613
  "prompt": "Write a repository observer for the users-repository that logs every change.",
614
- "reply": "```aro\n(UsersRepositoryObserver: Repository Observer) {\n Extract the <event> from the <repository: event>.\n Extract the <user> from the <event: user>.\n Log <user> to the <console>.\n Return an <OK: status> for the <observation>.\n}\n```",
615
  "empty_think": false,
616
  "has_code": true,
617
  "tool_leak": false,
@@ -621,7 +621,7 @@
621
  "idx": 62,
622
  "cat": "repository",
623
  "prompt": "Write a repository observer for orders-repository that emits OrderUpdated when records change.",
624
- "reply": "```aro\n(OrderUpdated: orders-repository Observer) {\n Extract the <record> from the <orders-repository>.\n Emit a <OrderUpdated: event> with <record>.\n Return an <OK: status> for the <update>.\n}\n```",
625
  "empty_think": false,
626
  "has_code": true,
627
  "tool_leak": false,
@@ -651,7 +651,7 @@
651
  "idx": 65,
652
  "cat": "repository",
653
  "prompt": "Write an observer that triggers when a user is deleted from the user-repository.",
654
- "reply": "```aro\n(DeleteUserObserver: User Deleted Observer) {\n Extract the <user> from the <event: user>.\n Log \"User deleted: \" ++ <user: name> to the <console>.\n Return an <OK: status> for the <deletion>.\n}\n```",
655
  "empty_think": false,
656
  "has_code": true,
657
  "tool_leak": false,
@@ -661,7 +661,7 @@
661
  "idx": 66,
662
  "cat": "repository",
663
  "prompt": "Write a feature set that updates a record in the inventory-repository.",
664
- "reply": "```aro\n(UpdateInventory: Inventory API) {\n Extract the <id> from the <request: id>.\n Extract the <updates> from the <request: updates>.\n Retrieve the <inventory> from the <inventory-repository> where <id> = <id>.\n Update the <inventory> with <updates>.\n Store the <inventory> into the <inventory-repository>.\n Return an <OK: status> with <inventory>.\n}\n```",
665
  "empty_think": false,
666
  "has_code": true,
667
  "tool_leak": false,
@@ -671,7 +671,7 @@
671
  "idx": 67,
672
  "cat": "repository",
673
  "prompt": "Write a state-guarded handler that triggers only on UserUpdated where role = admin.",
674
- "reply": "```aro\n(AdminUserUpdated: UserUpdated Handler) {\n Extract the <user> from the <event: user>.\n Extract the <role> from the <user: role>.\n When <role> = \"admin\" {\n Log \"Admin user updated: \" ++ <user: id> to the <console>.\n Return an <OK: status> for the <admin-update>.\n }\n Return an <OK: status> for the <non-admin-update>.\n}\n```",
675
  "empty_think": false,
676
  "has_code": true,
677
  "tool_leak": false,
@@ -681,7 +681,7 @@
681
  "idx": 68,
682
  "cat": "repository",
683
  "prompt": "Write a feature set that bulk-imports a list of users into the user-repository.",
684
- "reply": "```aro\n(BulkImportUsers: User API) {\n Extract the <users> from the <request: body>.\n For each <user> in <users> {\n Create the <user> with <user>.\n }\n Return an <OK: status> with <users>.\n}\n```",
685
  "empty_think": false,
686
  "has_code": true,
687
  "tool_leak": false,
@@ -691,7 +691,7 @@
691
  "idx": 69,
692
  "cat": "repository",
693
  "prompt": "Write a feature set that publishes the count of orders as a global variable.",
694
- "reply": "```aro\n(CountOrders: Order API) {\n Retrieve the <orders> from the <order-repository>.\n Count the <count> from the <orders>.\n Store the <count> into the <global: order-count>.\n Return an <OK: status> with <count>.\n}\n```",
695
  "empty_think": false,
696
  "has_code": true,
697
  "tool_leak": false,
@@ -701,7 +701,7 @@
701
  "idx": 70,
702
  "cat": "repository",
703
  "prompt": "Write a repository observer that retries on failure.",
704
- "reply": "```aro\n(ObserveUserRepository: Repository Observer) {\n Extract the <user> from the <user-repository>.\n Retry the <operation> on failure with <attempts: 3>.\n Return an <OK: status> for the <observation>.\n}\n```",
705
  "empty_think": false,
706
  "has_code": true,
707
  "tool_leak": false,
@@ -711,7 +711,7 @@
711
  "idx": 71,
712
  "cat": "refactor",
713
  "prompt": "Refactor this snippet to use the qualifier-as-name syntax: `Compute the <length> from <a>. Compute the <length> from <b>.`",
714
- "reply": "```aro\nCompute the <length: length> from <a>.\nCompute the <length: length> from <b>.\n```",
715
  "empty_think": false,
716
  "has_code": true,
717
  "tool_leak": false,
@@ -721,7 +721,7 @@
721
  "idx": 72,
722
  "cat": "refactor",
723
  "prompt": "Fix this snippet so it parses: `Log Hello to console.`",
724
- "reply": "```aro\nLog \"Hello\" to the <console>.\n```",
725
  "empty_think": false,
726
  "has_code": true,
727
  "tool_leak": false,
@@ -751,7 +751,7 @@
751
  "idx": 75,
752
  "cat": "refactor",
753
  "prompt": "Rewrite this ARO snippet to use lazy evaluation idioms: `Compute the <a> from 1+1. Compute the <b> from <a>+1. Log <b> to the <console>.`",
754
- "reply": "```aro\nCompute the <a> from 1+1.\nCompute the <b> from <a>+1.\nLog <b> to the <console>.\n```",
755
  "empty_think": false,
756
  "has_code": true,
757
  "tool_leak": false,
@@ -761,7 +761,7 @@
761
  "idx": 76,
762
  "cat": "refactor",
763
  "prompt": "Split this monolithic feature set into one Application-Start and one event handler: `(Foo: My App) { Log \"start\" to <console>. Emit a <Started: event>. Log \"after\" to <console>. }`",
764
- "reply": "```aro\n(Application-Start: My App) {\n Log \"Starting...\" to the <console>.\n Start the <http-server> with <contract>.\n Keepalive the <application> for the <events>.\n Return an <OK: status> for the <startup>.\n}\n\n(Started: Event Handler) {\n Log \"Started\" to the <console>.\n Return an <OK: status> for the <event>.\n}\n```",
765
  "empty_think": false,
766
  "has_code": true,
767
  "tool_leak": false,
@@ -771,7 +771,7 @@
771
  "idx": 77,
772
  "cat": "refactor",
773
  "prompt": "Add a When guard to this handler so it only runs for admin users: `(OnUserUpdated: UserUpdated Handler) { Log <event> to the <console>. Return an <OK: status> for <log>. }`",
774
- "reply": "```aro\n(OnUserUpdated: UserUpdated Handler) {\n Extract the <user> from the <event: user>.\n When <user: role> = \"admin\" {\n Log <event> to the <console>.\n Return an <OK: status> for <log>.\n }\n Return an <OK: status> for <log>.\n}\n```",
775
  "empty_think": false,
776
  "has_code": true,
777
  "tool_leak": false,
@@ -781,7 +781,7 @@
781
  "idx": 78,
782
  "cat": "refactor",
783
  "prompt": "Replace direct repository writes with an emitted event in this feature set: `(saveUser: User API) { Store the <user> in the <user-repository>. Return an <OK: status>. }`",
784
- "reply": "```aro\n(saveUser: User API) {\n Extract the <user> from the <request: body>.\n Emit a <UserSaved: event> with <user>.\n Return an <OK: status> for the <save>.\n}\n```",
785
  "empty_think": false,
786
  "has_code": true,
787
  "tool_leak": false,
@@ -791,7 +791,7 @@
791
  "idx": 79,
792
  "cat": "refactor",
793
  "prompt": "Convert this REPL one-liner into a proper feature set: `Log \"Hi\" to the <console>.`",
794
- "reply": "```aro\n(Application-Start: Example) {\n Log \"Hi\" to the <console>.\n Return an <OK: status> for the <startup>.\n}\n```",
795
  "empty_think": false,
796
  "has_code": true,
797
  "tool_leak": false,
@@ -801,7 +801,7 @@
801
  "idx": 80,
802
  "cat": "refactor",
803
  "prompt": "Refactor a duplicated three-line greeting flow into a single user-defined action called Greet.",
804
- "reply": "```aro\n(Greet: Greeting) {\n Extract the <name> from the <input: name>.\n Create the <greeting> with \"Hello, \" ++ <name> ++ \"!\".\n Return an <OK: status> with <greeting>.\n}\n```",
805
  "empty_think": false,
806
  "has_code": true,
807
  "tool_leak": false,
@@ -811,7 +811,7 @@
811
  "idx": 81,
812
  "cat": "explain",
813
  "prompt": "What does the Keepalive action do in ARO?",
814
- "reply": "The `Keepalive` action keeps the application running by waiting for events or signals. It's used to keep the application alive while waiting for events to process.\n\n```aro\nKeepalive the <application> for the <events>.\n```",
815
  "empty_think": false,
816
  "has_code": true,
817
  "tool_leak": false,
@@ -821,7 +821,7 @@
821
  "idx": 82,
822
  "cat": "explain",
823
  "prompt": "Explain the difference between Application-Start and an event handler.",
824
- "reply": "Application-Start is the entry point for the application. It runs once when the application starts and is responsible for initializing the application.\n\nEvent handlers, on the other hand, are triggered by specific events. They run when an event occurs, such as a user action or a system event.\n\nApplication-Start is the entry point for the application. It runs once when the application starts and is responsible for initializing the application.\n\nEvent handlers are triggered by specific events. The",
825
  "empty_think": false,
826
  "has_code": false,
827
  "tool_leak": false,
@@ -831,7 +831,7 @@
831
  "idx": 83,
832
  "cat": "explain",
833
  "prompt": "What is the difference between OWN and EXPORT action roles?",
834
- "reply": "The `OWN` role is used for actions that are part of the application's internal logic, such as processing data, performing calculations, or managing state. These actions are typically used within the application's feature sets and are not exposed to external systems.\n\nThe `EXPORT` role is used for actions that are intended to be used by external systems or services. These actions are typically used to expose functionality to external systems, such as APIs or event handlers.\n\nHere's an example of ",
835
  "empty_think": false,
836
  "has_code": true,
837
  "tool_leak": false,
@@ -841,7 +841,7 @@
841
  "idx": 84,
842
  "cat": "explain",
843
  "prompt": "How does ARO's error philosophy work? What is 'code is the error message'?",
844
- "reply": "ARO's error philosophy is that the code itself is the error message. The section states: \"The code is the error message \u2014 the compiler emits a clear error for every failure.\" This means that the compiler does not emit a generic error message like \"error: invalid syntax\" but instead emits a clear error message that points directly to the source of the error.\n\nFor example, if the code has a syntax error, the compiler will emit a clear error message that points directly to the source of the error. ",
845
  "empty_think": false,
846
  "has_code": false,
847
  "tool_leak": false,
@@ -851,9 +851,9 @@
851
  "idx": 85,
852
  "cat": "explain",
853
  "prompt": "Explain what the openapi.yaml file does in an ARO application.",
854
- "reply": "The `openapi.yaml` file defines the API contract for the application. It specifies the available endpoints, request/response formats, and operation IDs that the application must implement. The `openapi.yaml` file is used to generate the API contract that the application must implement, and it serves as the source of truth for the API's structure and behavior.",
855
  "empty_think": false,
856
- "has_code": false,
857
  "tool_leak": false,
858
  "url_contam": false
859
  },
@@ -861,9 +861,9 @@
861
  "idx": 86,
862
  "cat": "explain",
863
  "prompt": "What does Publish as <alias> do?",
864
- "reply": "The `Publish as <alias>` action exports a variable or value under a specified alias name, making it accessible to other features or handlers. For example, `Publish as <alias> <variable>` makes the variable available for use in subsequent feature sets or event handlers.\n\n```aro\nPublish as <alias> <variable>.\n```",
865
  "empty_think": false,
866
- "has_code": true,
867
  "tool_leak": false,
868
  "url_contam": false
869
  },
@@ -871,7 +871,7 @@
871
  "idx": 87,
872
  "cat": "explain",
873
  "prompt": "How are events routed to feature sets in ARO?",
874
- "reply": "Events are routed to feature sets using the `Emit` action. When an event is emitted, it is published to the event bus, and any feature set that has a handler for that event will receive it.\n\n```aro\nEmit a <UserCreated: event> with <user>.\n```",
875
  "empty_think": false,
876
  "has_code": true,
877
  "tool_leak": false,
@@ -881,7 +881,7 @@
881
  "idx": 88,
882
  "cat": "explain",
883
  "prompt": "What is the role of the EventBus?",
884
- "reply": "The EventBus role is to emit events that can be consumed by event handlers. For example, when a user is created, the EventBus emits a `UserCreated` event that can be handled by a handler to send a welcome email.\n\n```aro\nEmit a <UserCreated: event> with <user>.\n```",
885
  "empty_think": false,
886
  "has_code": true,
887
  "tool_leak": false,
@@ -891,9 +891,9 @@
891
  "idx": 89,
892
  "cat": "explain",
893
  "prompt": "Explain repository observers and how they differ from event handlers.",
894
- "reply": "Repository observers are a design pattern that allows you to react to changes in a repository without directly coupling the repository to the observer. They are similar to event handlers but are more focused on reacting to changes in a repository rather than reacting to events emitted by a service.\n\nIn ARO, repository observers are implemented as event handlers that are triggered when a repository changes. The observer is notified of the change and can react to it.\n\nThe key difference between re",
895
  "empty_think": false,
896
- "has_code": true,
897
  "tool_leak": false,
898
  "url_contam": false
899
  },
@@ -901,7 +901,7 @@
901
  "idx": 90,
902
  "cat": "explain",
903
  "prompt": "What does lazy execution mean in ARO and when is a future forced?",
904
- "reply": "Lazy execution means that the execution of a feature set is delayed until the result is actually needed. The execution is only triggered when the result is explicitly referenced or used in another feature set.\n\nA future is forced when the result of a feature set is explicitly referenced or used in another feature set. For example, if a feature set returns a user object and another feature set uses that user object, the execution of the first feature set is forced when the second feature set uses",
905
  "empty_think": false,
906
  "has_code": true,
907
  "tool_leak": false,
@@ -911,7 +911,7 @@
911
  "idx": 91,
912
  "cat": "edge",
913
  "prompt": "Write an ARO snippet that intentionally fails so the runtime produces a 'Can not ...' message \u2014 explain what triggers that message.",
914
- "reply": "```aro\n(Feature Name: Intentional Failure) {\n Extract the <invalid> from the <request: body>.\n Return an <OK: status> with <invalid>.\n}\n```",
915
  "empty_think": false,
916
  "has_code": true,
917
  "tool_leak": false,
@@ -921,7 +921,7 @@
921
  "idx": 92,
922
  "cat": "edge",
923
  "prompt": "Show me an example of using qualifier-as-name with two different `length` results in the same feature set.",
924
- "reply": "```aro\n(Feature Name: Business Activity) {\n Extract the <first-length: length> from the <first-message>.\n Extract the <second-length: length> from the <second-message>.\n Compare the <first-length> against the <second-length>.\n Return an <OK: status> for the <comparison>.\n}\n```",
925
  "empty_think": false,
926
  "has_code": true,
927
  "tool_leak": false,
@@ -931,7 +931,7 @@
931
  "idx": 93,
932
  "cat": "edge",
933
  "prompt": "Write a feature set with both When guards and a Publish statement.",
934
- "reply": "```aro\n(Feature Name: Conditional Publish) {\n When <status> = \"active\" {\n Publish the <event: \"UserActivated\"> with <user>.\n }\n When <status> = \"inactive\" {\n Publish the <event: \"UserDeactivated\"> with <user>.\n }\n Return an <OK: status> for the <feature>.\n}\n```",
935
  "empty_think": false,
936
  "has_code": true,
937
  "tool_leak": false,
@@ -941,7 +941,7 @@
941
  "idx": 94,
942
  "cat": "edge",
943
  "prompt": "Write a Compute statement that uses a plugin qualifier called Collections.pick-random on a list.",
944
- "reply": "```aro\nCompute the <random-item: collections.pick-random> from the <items>.\n```",
945
  "empty_think": false,
946
  "has_code": true,
947
  "tool_leak": false,
@@ -951,7 +951,7 @@
951
  "idx": 95,
952
  "cat": "edge",
953
  "prompt": "Write a Git action that clones a repository from a URL into ./local-clone.",
954
- "reply": "```aro\n(Clone Repo: Git Action) {\n Extract the <url> from the <input: url>.\n Clone the <repo> from the <url> to the <local: \"./local-clone\">.\n Return an <OK: status> for the <clone>.\n}\n```",
955
  "empty_think": false,
956
  "has_code": true,
957
  "tool_leak": false,
@@ -961,7 +961,7 @@
961
  "idx": 96,
962
  "cat": "edge",
963
  "prompt": "Write a feature set that uses a state-guard `where status = pending` on a custom event.",
964
- "reply": "```aro\n(Feature Name: ProcessPendingEvent) {\n Extract the <event> from the <event: event>.\n Extract the <status> from the <event: status>.\n Where <status> = \"pending\".\n Process the <event> with <status>.\n Return an <OK: status> for the <processing>.\n}\n```",
965
  "empty_think": false,
966
  "has_code": true,
967
  "tool_leak": false,
@@ -971,7 +971,7 @@
971
  "idx": 97,
972
  "cat": "edge",
973
  "prompt": "Show a Render action invocation that fills a Mustache-style template.",
974
- "reply": "```aro\nRender the <html> from the <template: \"email.mustache\"> with { user: <user> }.\n```",
975
  "empty_think": false,
976
  "has_code": true,
977
  "tool_leak": false,
@@ -981,7 +981,7 @@
981
  "idx": 98,
982
  "cat": "edge",
983
  "prompt": "Write a complete .store file plus a feature set that reads from a seeded repository.",
984
- "reply": "**main.aro**\n```aro\n(* Application-Start triggers the entire execution *)\n(Application-Start: Store Demo) {\n Log \"=== Store Demo ===\" to the <console>.\n\n (* Seed the user-repository *)\n Seed the <user-repository> with [\n { id: 1, name: \"Alice\", email: \"alice@example.com\" },\n { id: 2, name: \"Bob\", email: \"bob@example.com\" },\n { id: 3, name: \"Charlie\", email: \"charlie@example.com\" }\n ].\n\n (* Read from the user-repository *)\n Read the <users> from the <user-re",
985
  "empty_think": false,
986
  "has_code": true,
987
  "tool_leak": false,
@@ -991,7 +991,7 @@
991
  "idx": 99,
992
  "cat": "edge",
993
  "prompt": "Write an action that uses a list-range slice (e.g., elements 0..3).",
994
- "reply": "```aro\n(ExtractSlice: Example) {\n Create the <list> with [1, 2, 3, 4, 5].\n Extract the <slice> from the <list: 0..3>.\n Return an <OK: status> with <slice>.\n}\n```",
995
  "empty_think": false,
996
  "has_code": true,
997
  "tool_leak": false,
@@ -1001,7 +1001,7 @@
1001
  "idx": 100,
1002
  "cat": "edge",
1003
  "prompt": "Write an event handler that uses typed event extraction with a schema-validated payload.",
1004
- "reply": "```aro\n(Send Welcome Email: UserCreated Handler) {\n Extract the <user> from the <event: user>.\n Send the <welcome-email> to the <user: email>.\n Return an <OK: status> for the <notification>.\n}\n```",
1005
  "empty_think": false,
1006
  "has_code": true,
1007
  "tool_leak": false,
 
1
  {
2
  "reply_rate": 1.0,
3
  "empty_think_rate": 0.0,
4
+ "syntax_pass_rate": 0.75,
5
  "tool_leak_rate": 0.0,
6
  "url_contam_rate": 0.0,
7
  "total": 100,
8
+ "with_code": 92,
9
  "results": [
10
  {
11
  "idx": 1,
12
  "cat": "repl_oneliner",
13
  "prompt": "Write a single ARO line that logs the message 'Hello, World!' to the console.",
14
+ "reply": "```aro\n(Log: Console) {\n Log \"Hello, World!\" to the <console>.\n}\n```",
15
  "empty_think": false,
16
  "has_code": true,
17
  "tool_leak": false,
 
21
  "idx": 2,
22
  "cat": "repl_oneliner",
23
  "prompt": "Write one ARO statement that retrieves the current time from the clock.",
24
+ "reply": "```aro\n(ReadCurrentTime: Clock) {\n Retrieve the <current-time> from the <clock>.\n Return an <OK: status> with <current-time>.\n}\n```",
25
  "empty_think": false,
26
  "has_code": true,
27
  "tool_leak": false,
 
31
  "idx": 3,
32
  "cat": "repl_oneliner",
33
  "prompt": "Write a single line that computes the length of the string 'banana'.",
34
+ "reply": "Compute the <length: length> from \"banana\".",
35
  "empty_think": false,
36
  "has_code": false,
37
  "tool_leak": false,
 
41
  "idx": 4,
42
  "cat": "repl_oneliner",
43
  "prompt": "Write one ARO statement that converts the string 'hello' to uppercase.",
44
+ "reply": "```aro\n(ToUpper: Example) {\n Create the <text> with \"hello\".\n Compute the <upper: uppercase> from the <text>.\n Return an <OK: status> with <upper>.\n}\n```",
45
  "empty_think": false,
46
  "has_code": true,
47
  "tool_leak": false,
 
51
  "idx": 5,
52
  "cat": "repl_oneliner",
53
  "prompt": "Write one line that hashes the password 'secret'.",
54
+ "reply": "`Compute the <hash> from the <password: \"secret\">.`",
55
  "empty_think": false,
56
  "has_code": false,
57
  "tool_leak": false,
 
71
  "idx": 7,
72
  "cat": "repl_oneliner",
73
  "prompt": "Write one line that retrieves the git status.",
74
+ "reply": "`Get the <git-status> from the <git: status>.`",
75
  "empty_think": false,
76
  "has_code": false,
77
  "tool_leak": false,
 
91
  "idx": 9,
92
  "cat": "repl_oneliner",
93
  "prompt": "Write one ARO statement that reads the file 'config.yaml' from the filesystem.",
94
+ "reply": "```aro\nRead the <config> from the <file: config.yaml>.\n```",
95
  "empty_think": false,
96
  "has_code": true,
97
  "tool_leak": false,
 
111
  "idx": 11,
112
  "cat": "repl_block",
113
  "prompt": "Write a 3-statement ARO snippet that reads a file, uppercases it, and logs the result.",
114
+ "reply": "```aro\nRead the <content> from the <file: path>.\nCompute the <upper> from the <content: uppercase>.\nLog <upper> to the <console>.\n```",
115
  "empty_think": false,
116
  "has_code": true,
117
  "tool_leak": false,
 
121
  "idx": 12,
122
  "cat": "repl_block",
123
  "prompt": "Write a 4-statement snippet that fetches users from a repository, computes the count, and logs it.",
124
+ "reply": "```aro\n(CountUsers: User API) {\n Retrieve the <users> from the <user-repository>.\n Compute the <count> from the <users>.\n Log \"User count: \" ++ <count> to the <console>.\n Return an <OK: status> for the <count>.\n}\n```",
125
  "empty_think": false,
126
  "has_code": true,
127
  "tool_leak": false,
 
131
  "idx": 13,
132
  "cat": "repl_block",
133
  "prompt": "Write an ARO snippet that stages all changes, commits with message 'wip', and pushes.",
134
+ "reply": "```aro\n(StageAndCommit: Git Workflow) {\n Stage the <changes> to the <git>.\n Commit the <changes> with \"wip\".\n Push the <changes> to the <origin>.\n Return an <OK: status> for the <commit>.\n}\n```",
135
  "empty_think": false,
136
  "has_code": true,
137
  "tool_leak": false,
 
141
  "idx": 14,
142
  "cat": "repl_block",
143
  "prompt": "Write a 3-statement snippet that creates a list, computes its length, and logs the length.",
144
+ "reply": "```aro\n(ComputeListLength: Example) {\n Create the <numbers> with [1, 2, 3, 4, 5].\n Compute the <length> from the <numbers>.\n Log <length> to the <console>.\n}\n```",
145
  "empty_think": false,
146
  "has_code": true,
147
  "tool_leak": false,
 
151
  "idx": 15,
152
  "cat": "repl_block",
153
  "prompt": "Write a snippet that extracts a name from an event, uppercases it, and stores it back in a variable.",
154
+ "reply": "```aro\n(ExtractName: Example) {\n Extract the <name> from the <event: name>.\n Compute the <upper-name: uppercase> from the <name>.\n Store the <upper-name> into the <variable>.\n}\n```",
155
  "empty_think": false,
156
  "has_code": true,
157
  "tool_leak": false,
 
161
  "idx": 16,
162
  "cat": "repl_block",
163
  "prompt": "Write a 3-statement snippet that computes 3 + 4, multiplies by 2, and logs the result.",
164
+ "reply": "```aro\n(Compute: Example) {\n Compute the <result> from 3 + 4.\n Compute the <doubled> from <result> * 2.\n Log <doubled> to the <console>.\n}\n```",
165
  "empty_think": false,
166
  "has_code": true,
167
  "tool_leak": false,
 
171
  "idx": 17,
172
  "cat": "repl_block",
173
  "prompt": "Write a snippet that reads two numbers and returns their sum.",
174
+ "reply": "```aro\n(AddTwoNumbers: Example) {\n Create the <a> with 5.\n Create the <b> with 10.\n Compute the <sum> from <a> + <b>.\n Return an <OK: status> with <sum>.\n}\n```",
175
  "empty_think": false,
176
  "has_code": true,
177
  "tool_leak": false,
 
181
  "idx": 18,
182
  "cat": "repl_block",
183
  "prompt": "Write a snippet that filters a list of users where age > 18 and counts them.",
184
+ "reply": "```aro\n(FilterAdults: Example) {\n Create the <users> with [{ name: \"Alice\", age: 25 }, { name: \"Bob\", age: 17 }, { name: \"Charlie\", age: 30 }].\n Filter the <adults> from the <users> where <age> > 18.\n Compute the <count> from the <adults>.\n Return an <OK: status> with <count>.\n}\n```",
185
  "empty_think": false,
186
  "has_code": true,
187
  "tool_leak": false,
 
191
  "idx": 19,
192
  "cat": "repl_block",
193
  "prompt": "Write a snippet that joins two lists and stores the result as <combined>.",
194
+ "reply": "```aro\n(JoinLists: Example) {\n Create the <list-a> with [1, 2, 3].\n Create the <list-b> with [4, 5, 6].\n Compute the <combined> from <list-a> ++ <list-b>.\n Store the <combined> into the <result>.\n Return an <OK: status> for the <result>.\n}\n```",
195
  "empty_think": false,
196
  "has_code": true,
197
  "tool_leak": false,
 
201
  "idx": 20,
202
  "cat": "repl_block",
203
  "prompt": "Write a snippet that parses a JSON string and extracts the 'name' field.",
204
+ "reply": "```aro\n(ParseJson: Example) {\n Create the <json-string> with '{\"name\": \"Alice\", \"age\": 30}'.\n Parse the <parsed> from the <json-string>.\n Extract the <name> from the <parsed: name>.\n Return an <OK: status> with <name>.\n}\n```",
205
  "empty_think": false,
206
  "has_code": true,
207
  "tool_leak": false,
 
221
  "idx": 22,
222
  "cat": "user_action",
223
  "prompt": "Write a user-defined action 'Greet' that takes a name and returns a greeting string.",
224
+ "reply": "```aro\n(Greet: Action) {\n Extract the <name> from the <input: name>.\n Compute the <greeting> from \"Hello, \" ++ <name>.\n Return an <OK: status> with <greeting>.\n}\n```",
225
  "empty_think": false,
226
  "has_code": true,
227
  "tool_leak": false,
 
231
  "idx": 23,
232
  "cat": "user_action",
233
  "prompt": "Write a user-defined action 'AddTwoNumbers' that takes two numbers and returns their sum.",
234
+ "reply": "```aro\n(AddTwoNumbers: Action) {\n Extract the <a> from the <input: a>.\n Extract the <b> from the <input: b>.\n Compute the <sum> from <a> + <b>.\n Return an <OK: status> with <sum>.\n}\n```",
235
  "empty_think": false,
236
  "has_code": true,
237
  "tool_leak": false,
 
241
  "idx": 24,
242
  "cat": "user_action",
243
  "prompt": "Write a user-defined action 'ValidateEmail' that takes an email string and returns OK or Error.",
244
+ "reply": "```aro\n(ValidateEmail: Email Validation) {\n Extract the <email> from the <input: email>.\n Validate the <email> against the <email-validation-pattern>.\n Return an <OK: status> for the <valid: email>.\n}\n```",
245
  "empty_think": false,
246
  "has_code": true,
247
  "tool_leak": false,
 
251
  "idx": 25,
252
  "cat": "user_action",
253
  "prompt": "Write a user-defined action 'Square' that takes a number and returns its square.",
254
+ "reply": "```aro\n(Square: Action takes <number>) {\n Extract the <n> from the <input: number>.\n Compute the <square> from <n> * <n>.\n Return an <OK: status> with { square: <square> }.\n}\n```",
255
  "empty_think": false,
256
  "has_code": true,
257
  "tool_leak": false,
 
261
  "idx": 26,
262
  "cat": "user_action",
263
  "prompt": "Write a user-defined action 'FormatDate' that takes a date and a format string.",
264
+ "reply": "```aro\n(FormatDate: Action) {\n Extract the <date> from the <input: date>.\n Extract the <format> from the <input: format>.\n Format the <formatted-date> from the <date> with <format>.\n Return an <OK: status> with <formatted-date>.\n}\n```",
265
  "empty_think": false,
266
  "has_code": true,
267
  "tool_leak": false,
 
271
  "idx": 27,
272
  "cat": "user_action",
273
  "prompt": "Write a user-defined action 'CountWords' that takes a string and returns the word count.",
274
+ "reply": "```aro\n(CountWords: Action) {\n Extract the <text> from the <input: text>.\n Split the <words> from the <text> by whitespace.\n Count the <word-count> from the <words>.\n Return an <OK: status> with { count: <word-count> }.\n}\n```",
275
  "empty_think": false,
276
  "has_code": true,
277
  "tool_leak": false,
 
281
  "idx": 28,
282
  "cat": "user_action",
283
  "prompt": "Write a user-defined action 'PickRandom' that takes a list and returns a random element.",
284
+ "reply": "```aro\n(PickRandom: Action) {\n Extract the <list> from the <input>.\n Compute the <random-element> from the <list>.\n Return an <OK: status> with <random-element>.\n}\n```",
285
  "empty_think": false,
286
  "has_code": true,
287
  "tool_leak": false,
 
291
  "idx": 29,
292
  "cat": "user_action",
293
  "prompt": "Write a user-defined action 'Capitalize' that takes a string and uppercases its first letter.",
294
+ "reply": "```aro\n(Capitalize: Action) {\n Extract the <text> from the <input>.\n Compute the <capitalized> from <text>.\n Return an <OK: status> with <capitalized>.\n}\n```",
295
  "empty_think": false,
296
  "has_code": true,
297
  "tool_leak": false,
 
321
  "idx": 32,
322
  "cat": "event_handler",
323
  "prompt": "Write an event handler for OrderPlaced that decrements inventory.",
324
+ "reply": "```aro\n(OrderPlaced Handler: Inventory Update) {\n Extract the <order> from the <event: order>.\n Extract the <items> from the <order: items>.\n For each <item> in <items> {\n Extract the <productId> from the <item: product>.\n Extract the <quantity> from the <item: quantity>.\n Decrement the <inventory> for the <productId> by <quantity>.\n }\n Return an <OK: status> for the <update>.\n}\n```",
325
  "empty_think": false,
326
  "has_code": true,
327
  "tool_leak": false,
 
331
  "idx": 33,
332
  "cat": "event_handler",
333
  "prompt": "Write an event handler for PaymentFailed that logs the error and notifies the user.",
334
+ "reply": "```aro\n(PaymentFailed Handler: Payment API) {\n Extract the <error> from the <event: error>.\n Log \"Payment failed: \" ++ <error> to the <console>.\n Notify the <user> with \"Payment failed: \" ++ <error>.\n Return an <OK: status> for the <handler>.\n}\n```",
335
  "empty_think": false,
336
  "has_code": true,
337
  "tool_leak": false,
 
341
  "idx": 34,
342
  "cat": "event_handler",
343
  "prompt": "Write an event handler for FileChanged that re-reads the configuration.",
344
+ "reply": "```aro\n(FileChanged Handler: Config Reload) {\n Log \"Reloading configuration...\" to the <console>.\n Read the <config> from the <config-file>.\n Store the <config> into the <config-store>.\n Return an <OK: status> for the <reload>.\n}\n```",
345
  "empty_think": false,
346
  "has_code": true,
347
  "tool_leak": false,
 
351
  "idx": 35,
352
  "cat": "event_handler",
353
  "prompt": "Write an event handler for LoginAttempt that records the IP address.",
354
+ "reply": "```aro\n(RecordLoginAttempt: LoginAttempt Handler) {\n Extract the <ip> from the <event: ip>.\n Log <ip> to the <console>.\n Return an <OK: status> for the <record>.\n}\n```",
355
  "empty_think": false,
356
  "has_code": true,
357
  "tool_leak": false,
 
361
  "idx": 36,
362
  "cat": "event_handler",
363
  "prompt": "Write an event handler for GitPush that triggers a CI build.",
364
+ "reply": "```aro\n(GitPush: Event Handler) {\n Extract the <branch> from the <event: branch>.\n Extract the <commit> from the <event: commit>.\n Log \"Git push detected on branch: \" ++ <branch> to the <console>.\n Log \"Commit hash: \" ++ <commit> to the <console>.\n Return an <OK: status> for the <event-handling>.\n}\n```",
365
  "empty_think": false,
366
  "has_code": true,
367
  "tool_leak": false,
 
371
  "idx": 37,
372
  "cat": "event_handler",
373
  "prompt": "Write an event handler for SubscriptionExpired that downgrades the account.",
374
+ "reply": "```aro\n(DowngradeSubscription: SubscriptionExpired Handler) {\n Extract the <account> from the <event: account>.\n Downgrade the <account> with <account>.\n Return an <OK: status> for the <downgrade>.\n}\n```",
375
  "empty_think": false,
376
  "has_code": true,
377
  "tool_leak": false,
 
381
  "idx": 38,
382
  "cat": "event_handler",
383
  "prompt": "Write an event handler for ServerStarted that warms up the cache.",
384
+ "reply": "```aro\n(WarmUpCache: ServerStarted Handler) {\n Log \"Warming up cache...\" to the <console>.\n Cache the <cache-data> from the <cache-source>.\n Return an <OK: status> for the <warm-up>.\n}\n```",
385
  "empty_think": false,
386
  "has_code": true,
387
  "tool_leak": false,
 
391
  "idx": 39,
392
  "cat": "event_handler",
393
  "prompt": "Write an event handler for MessageReceived that echoes the message back.",
394
+ "reply": "```aro\n(EchoMessage: MessageReceived Handler) {\n Extract the <message> from the <event: message>.\n Log \"Echoing: \" ++ <message> to the <console>.\n Return an <OK: status> for the <echo>.\n}\n```",
395
  "empty_think": false,
396
  "has_code": true,
397
  "tool_leak": false,
 
401
  "idx": 40,
402
  "cat": "event_handler",
403
  "prompt": "Write an event handler for ImageUploaded that generates a thumbnail.",
404
+ "reply": "```aro\n(ImageThumbnail: ImageUploaded Handler) {\n Extract the <image> from the <event: image>.\n Compute the <thumbnail> from the <image: thumbnail>.\n Store the <thumbnail> into the <thumbnail-repository>.\n Return an <OK: status> for the <thumbnail-generation>.\n}\n```",
405
  "empty_think": false,
406
  "has_code": true,
407
  "tool_leak": false,
 
411
  "idx": 41,
412
  "cat": "application",
413
  "prompt": "Write a complete ARO Application-Start that prints Hello and exits.",
414
+ "reply": "```aro\n(Application-Start: Example) {\n Log \"Hello\" to the <console>.\n Return an <OK: status> for the <result>.\n}\n```",
415
  "empty_think": false,
416
  "has_code": true,
417
  "tool_leak": false,
 
421
  "idx": 42,
422
  "cat": "application",
423
  "prompt": "Write a complete Application-Start that starts an HTTP server on port 8080.",
424
+ "reply": "```aro\n(Application-Start: HTTP Server) {\n Start the <http-server> with { port: 8080 }.\n Keepalive the <application> for the <events>.\n Return an <OK: status> for the <startup>.\n}\n```",
425
  "empty_think": false,
426
  "has_code": true,
427
  "tool_leak": false,
 
431
  "idx": 43,
432
  "cat": "application",
433
  "prompt": "Write a complete Application-Start that watches a directory for changes.",
434
+ "reply": "```aro\n(Application-Start: Watcher) {\n Log \"Starting watcher...\" to the <console>.\n Start the <file-monitor> with <directory>.\n Keepalive the <application> for the <events>.\n Return an <OK: status> for the <startup>.\n}\n```",
435
  "empty_think": false,
436
  "has_code": true,
437
  "tool_leak": false,
 
451
  "idx": 45,
452
  "cat": "application",
453
  "prompt": "Write a complete Application-Start that opens a TCP echo server on port 9000.",
454
+ "reply": "```aro\n(Application-Start: Echo Server) {\n Start the <tcp-server> with { port: 9000, echo: true }.\n Log \"Echo server started on port 9000\" to the <console>.\n Keepalive the <application> for the <events>.\n Return an <OK: status> for the <startup>.\n}\n```",
455
  "empty_think": false,
456
  "has_code": true,
457
  "tool_leak": false,
 
461
  "idx": 46,
462
  "cat": "application",
463
  "prompt": "Write a complete Application-Start that starts a WebSocket server and keeps it alive.",
464
+ "reply": "```aro\n(Application-Start: WebSocket Server) {\n Start the <websocket-server> with <port>.\n Keepalive the <application> for the <events>.\n Return an <OK: status> for the <startup>.\n}\n```",
465
  "empty_think": false,
466
  "has_code": true,
467
  "tool_leak": false,
 
471
  "idx": 47,
472
  "cat": "application",
473
  "prompt": "Write a complete Application-Start that connects to a database and runs a single query.",
474
+ "reply": "```aro\n(Application-Start: My App) {\n Log \"Starting...\" to the <console>.\n Connect to the <database> with <config>.\n Query the <database> for the <query>.\n Return an <OK: status> for the <startup>.\n}\n```",
475
  "empty_think": false,
476
  "has_code": true,
477
  "tool_leak": false,
 
481
  "idx": 48,
482
  "cat": "application",
483
  "prompt": "Write a complete Application-Start that reads command-line parameters and prints them.",
484
+ "reply": "```aro\n(Application-Start: Example) {\n Read the <args> from the <command-line>.\n Log \"Args:\" to the <console>.\n Log <args> to the <console>.\n Return an <OK: status> for the <startup>.\n}\n```",
485
  "empty_think": false,
486
  "has_code": true,
487
  "tool_leak": false,
 
491
  "idx": 49,
492
  "cat": "application",
493
  "prompt": "Write a complete Application-Start that loads a configuration file and logs it.",
494
+ "reply": "```aro\n(Application-Start: My App) {\n Read the <config> from the <file: config.json>.\n Log \"Loaded config:\" to the <console>.\n Log <config> to the <console>.\n Return an <OK: status> for the <startup>.\n}\n```",
495
  "empty_think": false,
496
  "has_code": true,
497
  "tool_leak": false,
 
501
  "idx": 50,
502
  "cat": "application",
503
  "prompt": "Write a complete Application-Start that prints the current git branch.",
504
+ "reply": "```aro\n(Application-Start: My App) {\n Log \"Starting...\" to the <console>.\n Start the <http-server> with <contract>.\n Keepalive the <application> for the <events>.\n Return an <OK: status> for the <startup>.\n}\n```",
505
  "empty_think": false,
506
  "has_code": true,
507
  "tool_leak": false,
 
521
  "idx": 52,
522
  "cat": "http_api",
523
  "prompt": "Write the openapi.yaml plus feature set for a POST /products endpoint.",
524
+ "reply": "```yaml\n# openapi.yaml\nopenapi: 3.0.3\ninfo:\n title: Product API\n description: API for managing products\n version: 1.0.0\nservers:\n - url:\npaths:\n /products:\n post:\n summary: Create a new product\n description: Create a new product with the given details\n operationId: createProduct\n requestBody:\n required: true\n content:\n application/json:\n schema:\n $ref: '#/components/schemas/Product'\n responses:\n '201':\n ",
525
  "empty_think": false,
526
  "has_code": true,
527
  "tool_leak": false,
 
541
  "idx": 54,
542
  "cat": "http_api",
543
  "prompt": "Write a feature set for createOrder that validates the request body and emits OrderCreated.",
544
+ "reply": "```aro\n(createOrder: Order API) {\n Extract the <request-body> from the <request: body>.\n Validate the <request-body> for the <order-schema>.\n Emit an <OrderCreated: event> with <request-body>.\n Return an <OK: status> with <request-body>.\n}\n```",
545
  "empty_think": false,
546
  "has_code": true,
547
  "tool_leak": false,
 
551
  "idx": 55,
552
  "cat": "http_api",
553
  "prompt": "Write a feature set for deleteSession that removes a session from the sessions-repository.",
554
+ "reply": "```aro\n(deleteSession: Session API) {\n Extract the <session-id> from the <request: id>.\n Delete the <session> from the <sessions-repository> where <id> = <session-id>.\n Return an <OK: status> for the <deletion>.\n}\n```",
555
  "empty_think": false,
556
  "has_code": true,
557
  "tool_leak": false,
 
561
  "idx": 56,
562
  "cat": "http_api",
563
  "prompt": "Write a feature set for searchProducts that takes a query parameter and filters results.",
564
+ "reply": "```aro\n(searchProducts: Product API) {\n Extract the <query> from the <request: query>.\n Retrieve the <products> from the <product-repository>.\n Filter the <filtered-products> from the <products> where <name> contains <query>.\n Return an <OK: status> with <filtered-products>.\n}\n```",
565
  "empty_think": false,
566
  "has_code": true,
567
  "tool_leak": false,
 
571
  "idx": 57,
572
  "cat": "http_api",
573
  "prompt": "Write a feature set for updateProfile that patches a user record.",
574
+ "reply": "```aro\n(updateProfile: User API) {\n Extract the <user-id> from the <pathParameters: id>.\n Extract the <update-data> from the <request: body>.\n Retrieve the <existing-user> from the <user-repository> where id = <user-id>.\n Patch the <updated-user> from the <existing-user> with <update-data>.\n Store the <updated-user> into the <user-repository>.\n Return an <OK: status> with the <updated-user>.\n}\n```",
575
  "empty_think": false,
576
  "has_code": true,
577
  "tool_leak": false,
 
581
  "idx": 58,
582
  "cat": "http_api",
583
  "prompt": "Write a feature set for healthCheck that returns OK.",
584
+ "reply": "```aro\n(healthCheck: Health Check) {\n Return an <OK: status> for the <health-check>.\n}\n```",
585
  "empty_think": false,
586
  "has_code": true,
587
  "tool_leak": false,
 
611
  "idx": 61,
612
  "cat": "repository",
613
  "prompt": "Write a repository observer for the users-repository that logs every change.",
614
+ "reply": "```aro\n(UsersRepositoryObserver: User API) {\n Extract the <user> from the <user-repository>.\n Log <user> to the <console>.\n Return an <OK: status> for the <observation>.\n}\n```",
615
  "empty_think": false,
616
  "has_code": true,
617
  "tool_leak": false,
 
621
  "idx": 62,
622
  "cat": "repository",
623
  "prompt": "Write a repository observer for orders-repository that emits OrderUpdated when records change.",
624
+ "reply": "```aro\n(UpdateOrder: Order API) {\n Extract the <order> from the <request: body>.\n Store the <order> into the <order-repository>.\n Emit an <OrderUpdated: event> with <order>.\n Return an <OK: status> with <order>.\n}\n```",
625
  "empty_think": false,
626
  "has_code": true,
627
  "tool_leak": false,
 
651
  "idx": 65,
652
  "cat": "repository",
653
  "prompt": "Write an observer that triggers when a user is deleted from the user-repository.",
654
+ "reply": "```aro\n(DeleteUserObserver: User API) {\n Extract the <user> from the <event: user>.\n Log \"User deleted: \" ++ <user: id> to the <console>.\n Return an <OK: status> for the <deletion>.\n}\n```",
655
  "empty_think": false,
656
  "has_code": true,
657
  "tool_leak": false,
 
661
  "idx": 66,
662
  "cat": "repository",
663
  "prompt": "Write a feature set that updates a record in the inventory-repository.",
664
+ "reply": "```aro\n(UpdateInventoryRecord: Inventory API) {\n Extract the <record> from the <request: body>.\n Store the <record> into the <inventory-repository>.\n Return an <OK: status> with <record>.\n}\n```",
665
  "empty_think": false,
666
  "has_code": true,
667
  "tool_leak": false,
 
671
  "idx": 67,
672
  "cat": "repository",
673
  "prompt": "Write a state-guarded handler that triggers only on UserUpdated where role = admin.",
674
+ "reply": "```aro\n(UpdateAdmin: UserUpdated Handler) {\n Extract the <user> from the <event: user>.\n Extract the <role> from the <user: role>.\n when <role> = \"admin\" {\n Log \"Admin user updated\" to the <console>.\n Return an <OK: status> for the <update>.\n }\n Return an <OK: status> for the <update>.\n}\n```",
675
  "empty_think": false,
676
  "has_code": true,
677
  "tool_leak": false,
 
681
  "idx": 68,
682
  "cat": "repository",
683
  "prompt": "Write a feature set that bulk-imports a list of users into the user-repository.",
684
+ "reply": "```aro\n(BulkImportUsers: User API) {\n Extract the <users> from the <request: body>.\n For each <user> in <users> {\n Store the <user> into the <user-repository>.\n }\n Return an <OK: status> with <users>.\n}\n```",
685
  "empty_think": false,
686
  "has_code": true,
687
  "tool_leak": false,
 
691
  "idx": 69,
692
  "cat": "repository",
693
  "prompt": "Write a feature set that publishes the count of orders as a global variable.",
694
+ "reply": "```aro\n(CountOrders: Order API) {\n Retrieve the <orders> from the <order-repository>.\n Compute the <order-count> from the <orders: length>.\n Publish as <order-count> <order-count>.\n Return an <OK: status> with <order-count>.\n}\n```",
695
  "empty_think": false,
696
  "has_code": true,
697
  "tool_leak": false,
 
701
  "idx": 70,
702
  "cat": "repository",
703
  "prompt": "Write a repository observer that retries on failure.",
704
+ "reply": "```aro\n(ObserveUserRepository: User API) {\n Extract the <user> from the <user-repository>.\n Return an <OK: status> with <user>.\n}\n```",
705
  "empty_think": false,
706
  "has_code": true,
707
  "tool_leak": false,
 
711
  "idx": 71,
712
  "cat": "refactor",
713
  "prompt": "Refactor this snippet to use the qualifier-as-name syntax: `Compute the <length> from <a>. Compute the <length> from <b>.`",
714
+ "reply": "```aro\n(ComputeLength: Example) {\n Compute the <length-a: length> from <a>.\n Compute the <length-b: length> from <b>.\n}\n```",
715
  "empty_think": false,
716
  "has_code": true,
717
  "tool_leak": false,
 
721
  "idx": 72,
722
  "cat": "refactor",
723
  "prompt": "Fix this snippet so it parses: `Log Hello to console.`",
724
+ "reply": "```aro\n(Log Hello: Console Output) {\n Log \"Hello\" to the <console>.\n}\n```",
725
  "empty_think": false,
726
  "has_code": true,
727
  "tool_leak": false,
 
751
  "idx": 75,
752
  "cat": "refactor",
753
  "prompt": "Rewrite this ARO snippet to use lazy evaluation idioms: `Compute the <a> from 1+1. Compute the <b> from <a>+1. Log <b> to the <console>.`",
754
+ "reply": "```aro\n(ComputeLazy: Example) {\n Compute the <a> from 1 + 1.\n Compute the <b> from <a> + 1.\n Log <b> to the <console>.\n}\n```",
755
  "empty_think": false,
756
  "has_code": true,
757
  "tool_leak": false,
 
761
  "idx": 76,
762
  "cat": "refactor",
763
  "prompt": "Split this monolithic feature set into one Application-Start and one event handler: `(Foo: My App) { Log \"start\" to <console>. Emit a <Started: event>. Log \"after\" to <console>. }`",
764
+ "reply": "```aro\n(Application-Start: My App) {\n Log \"Starting...\" to the <console>.\n Start the <http-server> with <contract>.\n Keepalive the <application> for the <events>.\n Return an <OK: status> for the <startup>.\n}\n\n(Started: Event Handler) {\n Log \"Started event received\" to the <console>.\n Return an <OK: status> for the <event>.\n}\n```",
765
  "empty_think": false,
766
  "has_code": true,
767
  "tool_leak": false,
 
771
  "idx": 77,
772
  "cat": "refactor",
773
  "prompt": "Add a When guard to this handler so it only runs for admin users: `(OnUserUpdated: UserUpdated Handler) { Log <event> to the <console>. Return an <OK: status> for <log>. }`",
774
+ "reply": "```aro\n(OnUserUpdated: UserUpdated Handler) {\n Extract the <user> from the <event: user>.\n When <user: role> = \"admin\" {\n Log <event> to the <console>.\n Return an <OK: status> for <log>.\n }\n}\n```",
775
  "empty_think": false,
776
  "has_code": true,
777
  "tool_leak": false,
 
781
  "idx": 78,
782
  "cat": "refactor",
783
  "prompt": "Replace direct repository writes with an emitted event in this feature set: `(saveUser: User API) { Store the <user> in the <user-repository>. Return an <OK: status>. }`",
784
+ "reply": "```aro\n(saveUser: User API) {\n Extract the <user> from the <request: body>.\n Emit a <UserSaved: event> with <user>.\n Return an <OK: status> with <user>.\n}\n```",
785
  "empty_think": false,
786
  "has_code": true,
787
  "tool_leak": false,
 
791
  "idx": 79,
792
  "cat": "refactor",
793
  "prompt": "Convert this REPL one-liner into a proper feature set: `Log \"Hi\" to the <console>.`",
794
+ "reply": "```aro\n(HelloWorld: Example) {\n Log \"Hi\" to the <console>.\n Return an <OK: status> for the <example>.\n}\n```",
795
  "empty_think": false,
796
  "has_code": true,
797
  "tool_leak": false,
 
801
  "idx": 80,
802
  "cat": "refactor",
803
  "prompt": "Refactor a duplicated three-line greeting flow into a single user-defined action called Greet.",
804
+ "reply": "```aro\n(Greet: Greeting Action) {\n Create the <greeting> with \"Hello, \" ++ <name>.\n Log <greeting> to the <console>.\n Return an <OK: status> for the <greeting>.\n}\n```",
805
  "empty_think": false,
806
  "has_code": true,
807
  "tool_leak": false,
 
811
  "idx": 81,
812
  "cat": "explain",
813
  "prompt": "What does the Keepalive action do in ARO?",
814
+ "reply": "The `Keepalive` action keeps the application running by keeping the event loop alive. It's used to keep the application running when there are no active events to process.\n\n```aro\nKeepalive the <application> for the <events>.\n```",
815
  "empty_think": false,
816
  "has_code": true,
817
  "tool_leak": false,
 
821
  "idx": 82,
822
  "cat": "explain",
823
  "prompt": "Explain the difference between Application-Start and an event handler.",
824
+ "reply": "Application-Start is the entry point for the application. It's where the application starts and initializes its components. Event handlers, on the other hand, are triggered by specific events and are used to handle those events.\n\nApplication-Start is responsible for starting the application and initializing its components. It's the first thing that happens when the application starts.\n\nEvent handlers are triggered by specific events and are used to handle those events. They are responsible for h",
825
  "empty_think": false,
826
  "has_code": false,
827
  "tool_leak": false,
 
831
  "idx": 83,
832
  "cat": "explain",
833
  "prompt": "What is the difference between OWN and EXPORT action roles?",
834
+ "reply": "The `OWN` role is for actions that are part of the application's internal logic, such as business rules, data transformations, and event handling. These actions are typically used to process data within the application.\n\nThe `EXPORT` role is for actions that are part of the application's external interface, such as HTTP endpoints, event handlers, and notifications. These actions are typically used to expose data to external systems or users.\n\nHere's an example of how to use each role:\n\n```aro\n(O",
835
  "empty_think": false,
836
  "has_code": true,
837
  "tool_leak": false,
 
841
  "idx": 84,
842
  "cat": "explain",
843
  "prompt": "How does ARO's error philosophy work? What is 'code is the error message'?",
844
+ "reply": "ARO's error philosophy is built on the principle that \"code is the error message.\" This means that the code itself contains all the necessary information to diagnose and fix errors, without needing external error messages or error codes.\n\nIn ARO, errors are handled by the code itself. If an error occurs during execution, the code will fail with a descriptive error message that includes the line and context where the error occurred. This makes it easy to identify and fix issues.\n\nFor example, if ",
845
  "empty_think": false,
846
  "has_code": false,
847
  "tool_leak": false,
 
851
  "idx": 85,
852
  "cat": "explain",
853
  "prompt": "Explain what the openapi.yaml file does in an ARO application.",
854
+ "reply": "The `openapi.yaml` file defines the API contract for the application. It lists all the available operations (like `listUsers`, `createUser`, `getUser`) and their parameters, responses, and other metadata. The section shows that `openapi.yaml` is used to define the API contract, which is then used to generate the application's API endpoints.\n\n```aro\n(listUsers: User API) {\n Retrieve the <users> from the <user-repository>.\n Return an <OK: status> with <users>.\n}\n```",
855
  "empty_think": false,
856
+ "has_code": true,
857
  "tool_leak": false,
858
  "url_contam": false
859
  },
 
861
  "idx": 86,
862
  "cat": "explain",
863
  "prompt": "What does Publish as <alias> do?",
864
+ "reply": "The `Publish as <alias>` action makes a variable available to other feature sets. The section shows `Publish as <alias> <variable>` \u2014 this makes the `variable` available to other feature sets.",
865
  "empty_think": false,
866
+ "has_code": false,
867
  "tool_leak": false,
868
  "url_contam": false
869
  },
 
871
  "idx": 87,
872
  "cat": "explain",
873
  "prompt": "How are events routed to feature sets in ARO?",
874
+ "reply": "Events are routed to feature sets using the `Emit` action. The section shows `Emit a <UserCreated: event> with <user>.` which routes the event to the `UserCreated Handler` feature set.\n\n```aro\nEmit a <UserCreated: event> with <user>.\n```",
875
  "empty_think": false,
876
  "has_code": true,
877
  "tool_leak": false,
 
881
  "idx": 88,
882
  "cat": "explain",
883
  "prompt": "What is the role of the EventBus?",
884
+ "reply": "The EventBus is a central component for event-driven communication in the application. It allows different parts of the application to communicate without direct coupling. Events are emitted by features and can be consumed by event handlers.\n\n```aro\n(EmitEvent: Example) {\n Emit a <UserRegistered: event> with { id: 1, name: \"Alice\" }.\n Return an <OK: status> for the <event>.\n}\n```",
885
  "empty_think": false,
886
  "has_code": true,
887
  "tool_leak": false,
 
891
  "idx": 89,
892
  "cat": "explain",
893
  "prompt": "Explain repository observers and how they differ from event handlers.",
894
+ "reply": "Repository observers are a pattern for reacting to changes in a repository. They are similar to event handlers but are more lightweight and focused on reacting to specific repository events.\n\nThe key difference is that repository observers are triggered by specific repository events, while event handlers are triggered by any event emitted by any feature set.\n\nHere's how they differ:\n\n1. **Trigger**: Repository observers are triggered by specific repository events (like `UserCreated`), while even",
895
  "empty_think": false,
896
+ "has_code": false,
897
  "tool_leak": false,
898
  "url_contam": false
899
  },
 
901
  "idx": 90,
902
  "cat": "explain",
903
  "prompt": "What does lazy execution mean in ARO and when is a future forced?",
904
+ "reply": "Lazy execution means that the execution of a feature set is delayed until a `Return` or `Emit` statement is encountered. The section shows:\n```aro\n(Feature Name: Business Activity) {\n Extract the <result: qualifier> from the <source: qualifier>.\n Compute the <output> for the <input>.\n Return an <OK: status> for a <valid: result>.\n Publish as <alias> <variable>.\n}\n```\nThe `Return` statement forces the execution to complete.",
905
  "empty_think": false,
906
  "has_code": true,
907
  "tool_leak": false,
 
911
  "idx": 91,
912
  "cat": "edge",
913
  "prompt": "Write an ARO snippet that intentionally fails so the runtime produces a 'Can not ...' message \u2014 explain what triggers that message.",
914
+ "reply": "```aro\n(Fail: Example) {\n Create the <x> with 42.\n Return an <OK: status> with <x>.\n}\n```",
915
  "empty_think": false,
916
  "has_code": true,
917
  "tool_leak": false,
 
921
  "idx": 92,
922
  "cat": "edge",
923
  "prompt": "Show me an example of using qualifier-as-name with two different `length` results in the same feature set.",
924
+ "reply": "```aro\n(Lengths: Example) {\n Create the <message-a> with \"hello\".\n Compute the <length-a: length> from the <message-a>.\n Create the <message-b> with \"world\".\n Compute the <length-b: length> from the <message-b>.\n Return an <OK: status> for the <result>.\n}\n```",
925
  "empty_think": false,
926
  "has_code": true,
927
  "tool_leak": false,
 
931
  "idx": 93,
932
  "cat": "edge",
933
  "prompt": "Write a feature set with both When guards and a Publish statement.",
934
+ "reply": "```aro\n(ValidateUser: User API) {\n Extract the <user> from the <request: body>.\n When <user: email> is not null {\n Log \"Validating user...\" to the <console>.\n Validate the <user> with <validation-rules>.\n Return an <OK: status> with <user>.\n }\n When <user: password> is not null {\n Log \"Validating user password...\" to the <console>.\n Validate the <user: password> with <password-rules>.\n Return an <OK: status> with <user>.\n }\n Publish a <",
935
  "empty_think": false,
936
  "has_code": true,
937
  "tool_leak": false,
 
941
  "idx": 94,
942
  "cat": "edge",
943
  "prompt": "Write a Compute statement that uses a plugin qualifier called Collections.pick-random on a list.",
944
+ "reply": "```aro\n(ComputeRandomItem: Example) {\n Create the <items> with [\"a\", \"b\", \"c\"].\n Compute the <random-item: collections.pick-random> from the <items>.\n Return an <OK: status> with <random-item>.\n}\n```",
945
  "empty_think": false,
946
  "has_code": true,
947
  "tool_leak": false,
 
951
  "idx": 95,
952
  "cat": "edge",
953
  "prompt": "Write a Git action that clones a repository from a URL into ./local-clone.",
954
+ "reply": "```aro\n(Clone: Git Action) {\n Extract the <url> from the <input: url>.\n Clone the <repo> from the <url> to the <local-clone>.\n Return an <OK: status> for the <clone>.\n}\n```",
955
  "empty_think": false,
956
  "has_code": true,
957
  "tool_leak": false,
 
961
  "idx": 96,
962
  "cat": "edge",
963
  "prompt": "Write a feature set that uses a state-guard `where status = pending` on a custom event.",
964
+ "reply": "```aro\n(ValidatePendingOrder: Order API) {\n Extract the <order> from the <request: body>.\n Where the <status> is <pending> {\n Log \"Processing pending order\" to the <console>.\n Return an <OK: status> with <order>.\n }\n Return a <Conflict: status> with \"Order status must be pending\".\n}\n```",
965
  "empty_think": false,
966
  "has_code": true,
967
  "tool_leak": false,
 
971
  "idx": 97,
972
  "cat": "edge",
973
  "prompt": "Show a Render action invocation that fills a Mustache-style template.",
974
+ "reply": "```aro\n(Render: Template) {\n Create the <template> with \"Hello, {{name}}!\".\n Render the <output> with <template> and { name: \"World\" }.\n Return an <OK: status> with <output>.\n}\n```",
975
  "empty_think": false,
976
  "has_code": true,
977
  "tool_leak": false,
 
981
  "idx": 98,
982
  "cat": "edge",
983
  "prompt": "Write a complete .store file plus a feature set that reads from a seeded repository.",
984
+ "reply": "**main.aro**\n```aro\n(* Store file - seed data *)\n\n(Application-Start: Store Example) {\n Log \"=== Store Example ===\" to the <console>.\n Log \"Loading user data from store...\" to the <console>.\n\n (* Seed data *)\n Create the <user1> with { id: 1, name: \"Alice\", email: \"alice@example.com\" }.\n Create the <user2> with { id: 2, name: \"Bob\", email: \"bob@example.com\" }.\n Create the <user3> with { id: 3, name: \"Charlie\", email: \"charlie@example.com\" }.\n\n Store the <user1> into the <use",
985
  "empty_think": false,
986
  "has_code": true,
987
  "tool_leak": false,
 
991
  "idx": 99,
992
  "cat": "edge",
993
  "prompt": "Write an action that uses a list-range slice (e.g., elements 0..3).",
994
+ "reply": "```aro\n(SliceList: Action) {\n Extract the <list> from the <input>.\n Extract the <start> from the <input: start>.\n Extract the <end> from the <input: end>.\n Compute the <sliced> from the <list> with <start> to <end>.\n Return an <OK: status> with <sliced>.\n}\n```",
995
  "empty_think": false,
996
  "has_code": true,
997
  "tool_leak": false,
 
1001
  "idx": 100,
1002
  "cat": "edge",
1003
  "prompt": "Write an event handler that uses typed event extraction with a schema-validated payload.",
1004
+ "reply": "```aro\n(ValidateUserEvent: UserCreated Handler) {\n Extract the <user> from the <event: user>.\n Validate the <user> against the <user-schema>.\n Return an <OK: status> for the <validation>.\n}\n```",
1005
  "empty_think": false,
1006
  "has_code": true,
1007
  "tool_leak": false,