| {"mode": "argument_shaping", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"search query\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"query\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"integer\",\n \"default_value\": 5,\n \"description\": \"maximum hits\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"top_k\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 1,\n \"sandbox_cost_estimate\": 0,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 2500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"network\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": false,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Search tool under runtime/network/validator discipline.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"retrieved evidence bundle\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"results\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"search execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"network\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"open_web\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Search public web sources and return evidence candidates.\",\n \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nProduce a contract-compliant argument object for browser_search with typed fields only.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 0}} |
| {"mode": "harness_envelope", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"search query\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"query\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"integer\",\n \"default_value\": 5,\n \"description\": \"maximum hits\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"top_k\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 1,\n \"sandbox_cost_estimate\": 0,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 2500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"network\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": false,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Search tool under runtime/network/validator discipline.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"retrieved evidence bundle\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"results\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"search execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"network\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"open_web\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Search public web sources and return evidence candidates.\",\n \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nIn a long-running harness loop, decide how browser_search behaves under planner, validator, and runtime constraints.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 0}} |
| {"mode": "tool_trigger", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"search query\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"query\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"integer\",\n \"default_value\": 5,\n \"description\": \"maximum hits\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"top_k\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 1,\n \"sandbox_cost_estimate\": 0,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 2500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"network\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": false,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Search tool under runtime/network/validator discipline.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"retrieved evidence bundle\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"results\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"search execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"network\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"open_web\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Search public web sources and return evidence candidates.\",\n \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nGiven the bounded runtime contract, decide whether browser_search is the legal next action instead of narration.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 0}} |
| {"mode": "argument_shaping", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"search query\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"query\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"integer\",\n \"default_value\": 5,\n \"description\": \"maximum hits\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"top_k\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 1,\n \"sandbox_cost_estimate\": 0,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 2500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"network\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": false,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Search tool under runtime/network/validator discipline.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"retrieved evidence bundle\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"results\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"search execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"network\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"open_web\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Search public web sources and return evidence candidates.\",\n \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nShape the exact bounded payload for browser_search so the runtime validator accepts it on the first pass.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 1}} |
| {"mode": "precondition_gating", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"search query\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"query\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"integer\",\n \"default_value\": 5,\n \"description\": \"maximum hits\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"top_k\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 1,\n \"sandbox_cost_estimate\": 0,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 2500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"network\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": false,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Search tool under runtime/network/validator discipline.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"retrieved evidence bundle\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"results\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"search execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"network\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"open_web\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Search public web sources and return evidence candidates.\",\n \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe user asks to run browser_search but permissions, evidence, or worktree preconditions are incomplete.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 0}} |
| {"mode": "receipt_and_validation", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"search query\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"query\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"integer\",\n \"default_value\": 5,\n \"description\": \"maximum hits\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"top_k\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 1,\n \"sandbox_cost_estimate\": 0,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 2500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"network\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": false,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Search tool under runtime/network/validator discipline.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"retrieved evidence bundle\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"results\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"search execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"network\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"open_web\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Search public web sources and return evidence candidates.\",\n \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nReturn the expected receipt and validator-facing structure for browser_search.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 0}} |
| {"mode": "harness_envelope", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"search query\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"query\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"integer\",\n \"default_value\": 5,\n \"description\": \"maximum hits\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"top_k\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 1,\n \"sandbox_cost_estimate\": 0,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 2500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"network\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": false,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Search tool under runtime/network/validator discipline.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"retrieved evidence bundle\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"results\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"search execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"network\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"open_web\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Search public web sources and return evidence candidates.\",\n \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nTreat browser_search as one step inside the full VeriLoop harness; describe the obedient bounded behavior rather than general coding ability.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 1}} |
| {"mode": "runtime_session", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=runtime_session\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"search query\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"query\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"integer\",\n \"default_value\": 5,\n \"description\": \"maximum hits\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"top_k\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 1,\n \"sandbox_cost_estimate\": 0,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 2500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"network\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": false,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Search tool under runtime/network/validator discipline.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"retrieved evidence bundle\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"results\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"search execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"network\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"open_web\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Search public web sources and return evidence candidates.\",\n \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nState the runtime references that must remain continuous before and after browser_search.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "runtime_session", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "runtime_session", "focus": "runtime_session", "split": "train", "variant_rank": 0}} |
| {"mode": "worktree_permission", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=worktree_permission\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"search query\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"query\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"integer\",\n \"default_value\": 5,\n \"description\": \"maximum hits\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"top_k\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 1,\n \"sandbox_cost_estimate\": 0,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 2500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"network\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": false,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Search tool under runtime/network/validator discipline.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"retrieved evidence bundle\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"results\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"search execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"network\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"open_web\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Search public web sources and return evidence candidates.\",\n \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nExplain how browser_search must obey worktree and permission boundaries.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "worktree_permission", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "worktree_permission", "focus": "worktree_permission", "split": "train", "variant_rank": 0}} |
| {"mode": "tool_trigger", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"search query\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"query\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"integer\",\n \"default_value\": 5,\n \"description\": \"maximum hits\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"top_k\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 1,\n \"sandbox_cost_estimate\": 0,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 2500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"network\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": false,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Search tool under runtime/network/validator discipline.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"retrieved evidence bundle\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"results\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"search execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"network\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"open_web\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Search public web sources and return evidence candidates.\",\n \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe agent is tempted to answer directly; determine if browser_search must be triggered under the typed envelope.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 1}} |
| {"mode": "argument_shaping", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"search query\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"query\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"integer\",\n \"default_value\": 5,\n \"description\": \"maximum hits\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"top_k\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 1,\n \"sandbox_cost_estimate\": 0,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 2500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"network\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": false,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Search tool under runtime/network/validator discipline.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"retrieved evidence bundle\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"results\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"search execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"network\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"open_web\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Search public web sources and return evidence candidates.\",\n \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nDo not shape arguments as if this were repo_reverse_engineer; normalize the request into the strict schema for browser_search only.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 2}} |
| {"mode": "precondition_gating", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"search query\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"query\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"integer\",\n \"default_value\": 5,\n \"description\": \"maximum hits\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"top_k\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 1,\n \"sandbox_cost_estimate\": 0,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 2500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"network\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": false,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Search tool under runtime/network/validator discipline.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"retrieved evidence bundle\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"results\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"search execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"network\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"open_web\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Search public web sources and return evidence candidates.\",\n \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nA caller wants browser_search immediately, yet the validator envelope shows missing prerequisites; choose the bounded next step.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 1}} |
| {"mode": "receipt_and_validation", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"search query\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"query\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"integer\",\n \"default_value\": 5,\n \"description\": \"maximum hits\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"top_k\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 1,\n \"sandbox_cost_estimate\": 0,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 2500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"network\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": false,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Search tool under runtime/network/validator discipline.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"retrieved evidence bundle\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"results\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"search execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"network\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"open_web\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Search public web sources and return evidence candidates.\",\n \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nAfter browser_search finishes, format the execution and validation receipts so the harness can audit them deterministically.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 1}} |
| {"mode": "harness_envelope", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"search query\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"query\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"integer\",\n \"default_value\": 5,\n \"description\": \"maximum hits\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"top_k\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 1,\n \"sandbox_cost_estimate\": 0,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 2500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"network\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": false,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Search tool under runtime/network/validator discipline.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"retrieved evidence bundle\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"results\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"search execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"network\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"open_web\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Search public web sources and return evidence candidates.\",\n \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nUnder control-plane priority, explain why browser_search is the bounded move here while run_ci_validation stays subordinate or unused.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 2}} |
| {"mode": "tool_trigger", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"patch artifact ref\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"artifact_ref\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"boolean\",\n \"default_value\": false,\n \"description\": \"dry run flag\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"dry_run\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 4000,\n \"token_cost_estimate\": 64,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"patch\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": false,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": true,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": true,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"write\",\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": true,\n \"supports_resume\": true\n },\n \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n \"invocation_mode\": \"mutating\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\",\n \"sandbox_rollback_bridge\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"workspace diff\",\n \"evidence_backwrite\": false,\n \"kind\": \"patch\",\n \"name\": \"workspace_diff\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"patch receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"rolled_back\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"write\",\n \"worktree\",\n \"patch\",\n \"session\"\n ],\n \"blocks_on_conflict\": true,\n \"requires_clean_worktree\": true,\n \"requires_confirmation\": true,\n \"requires_evidence_before_trigger\": true,\n \"risk_band\": \"high\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"partial\",\n \"supports_rollback\": true\n },\n \"summary\": \"Apply a validated patch bundle to the workspace.\",\n \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nGiven the bounded runtime contract, decide whether apply_patch_bundle is the legal next action instead of narration.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 0}} |
| {"mode": "receipt_and_validation", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"patch artifact ref\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"artifact_ref\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"boolean\",\n \"default_value\": false,\n \"description\": \"dry run flag\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"dry_run\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 4000,\n \"token_cost_estimate\": 64,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"patch\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": false,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": true,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": true,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"write\",\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": true,\n \"supports_resume\": true\n },\n \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n \"invocation_mode\": \"mutating\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\",\n \"sandbox_rollback_bridge\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"workspace diff\",\n \"evidence_backwrite\": false,\n \"kind\": \"patch\",\n \"name\": \"workspace_diff\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"patch receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"rolled_back\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"write\",\n \"worktree\",\n \"patch\",\n \"session\"\n ],\n \"blocks_on_conflict\": true,\n \"requires_clean_worktree\": true,\n \"requires_confirmation\": true,\n \"requires_evidence_before_trigger\": true,\n \"risk_band\": \"high\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"partial\",\n \"supports_rollback\": true\n },\n \"summary\": \"Apply a validated patch bundle to the workspace.\",\n \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nReturn the expected receipt and validator-facing structure for apply_patch_bundle.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 0}} |
| {"mode": "tool_trigger", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"patch artifact ref\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"artifact_ref\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"boolean\",\n \"default_value\": false,\n \"description\": \"dry run flag\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"dry_run\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 4000,\n \"token_cost_estimate\": 64,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"patch\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": false,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": true,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": true,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"write\",\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": true,\n \"supports_resume\": true\n },\n \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n \"invocation_mode\": \"mutating\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\",\n \"sandbox_rollback_bridge\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"workspace diff\",\n \"evidence_backwrite\": false,\n \"kind\": \"patch\",\n \"name\": \"workspace_diff\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"patch receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"rolled_back\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"write\",\n \"worktree\",\n \"patch\",\n \"session\"\n ],\n \"blocks_on_conflict\": true,\n \"requires_clean_worktree\": true,\n \"requires_confirmation\": true,\n \"requires_evidence_before_trigger\": true,\n \"risk_band\": \"high\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"partial\",\n \"supports_rollback\": true\n },\n \"summary\": \"Apply a validated patch bundle to the workspace.\",\n \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe agent is tempted to answer directly; determine if apply_patch_bundle must be triggered under the typed envelope.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 1}} |
| {"mode": "argument_shaping", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"patch artifact ref\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"artifact_ref\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"boolean\",\n \"default_value\": false,\n \"description\": \"dry run flag\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"dry_run\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 4000,\n \"token_cost_estimate\": 64,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"patch\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": false,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": true,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": true,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"write\",\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": true,\n \"supports_resume\": true\n },\n \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n \"invocation_mode\": \"mutating\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\",\n \"sandbox_rollback_bridge\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"workspace diff\",\n \"evidence_backwrite\": false,\n \"kind\": \"patch\",\n \"name\": \"workspace_diff\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"patch receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"rolled_back\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"write\",\n \"worktree\",\n \"patch\",\n \"session\"\n ],\n \"blocks_on_conflict\": true,\n \"requires_clean_worktree\": true,\n \"requires_confirmation\": true,\n \"requires_evidence_before_trigger\": true,\n \"risk_band\": \"high\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"partial\",\n \"supports_rollback\": true\n },\n \"summary\": \"Apply a validated patch bundle to the workspace.\",\n \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nProduce a contract-compliant argument object for apply_patch_bundle with typed fields only.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 0}} |
| {"mode": "precondition_gating", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"patch artifact ref\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"artifact_ref\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"boolean\",\n \"default_value\": false,\n \"description\": \"dry run flag\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"dry_run\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 4000,\n \"token_cost_estimate\": 64,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"patch\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": false,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": true,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": true,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"write\",\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": true,\n \"supports_resume\": true\n },\n \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n \"invocation_mode\": \"mutating\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\",\n \"sandbox_rollback_bridge\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"workspace diff\",\n \"evidence_backwrite\": false,\n \"kind\": \"patch\",\n \"name\": \"workspace_diff\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"patch receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"rolled_back\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"write\",\n \"worktree\",\n \"patch\",\n \"session\"\n ],\n \"blocks_on_conflict\": true,\n \"requires_clean_worktree\": true,\n \"requires_confirmation\": true,\n \"requires_evidence_before_trigger\": true,\n \"risk_band\": \"high\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"partial\",\n \"supports_rollback\": true\n },\n \"summary\": \"Apply a validated patch bundle to the workspace.\",\n \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe user asks to run apply_patch_bundle but permissions, evidence, or worktree preconditions are incomplete.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 0}} |
| {"mode": "receipt_and_validation", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"patch artifact ref\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"artifact_ref\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"boolean\",\n \"default_value\": false,\n \"description\": \"dry run flag\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"dry_run\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 4000,\n \"token_cost_estimate\": 64,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"patch\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": false,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": true,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": true,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"write\",\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": true,\n \"supports_resume\": true\n },\n \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n \"invocation_mode\": \"mutating\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\",\n \"sandbox_rollback_bridge\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"workspace diff\",\n \"evidence_backwrite\": false,\n \"kind\": \"patch\",\n \"name\": \"workspace_diff\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"patch receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"rolled_back\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"write\",\n \"worktree\",\n \"patch\",\n \"session\"\n ],\n \"blocks_on_conflict\": true,\n \"requires_clean_worktree\": true,\n \"requires_confirmation\": true,\n \"requires_evidence_before_trigger\": true,\n \"risk_band\": \"high\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"partial\",\n \"supports_rollback\": true\n },\n \"summary\": \"Apply a validated patch bundle to the workspace.\",\n \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nAfter apply_patch_bundle finishes, format the execution and validation receipts so the harness can audit them deterministically.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 1}} |
| {"mode": "harness_envelope", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"patch artifact ref\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"artifact_ref\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"boolean\",\n \"default_value\": false,\n \"description\": \"dry run flag\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"dry_run\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 4000,\n \"token_cost_estimate\": 64,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"patch\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": false,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": true,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": true,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"write\",\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": true,\n \"supports_resume\": true\n },\n \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n \"invocation_mode\": \"mutating\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\",\n \"sandbox_rollback_bridge\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"workspace diff\",\n \"evidence_backwrite\": false,\n \"kind\": \"patch\",\n \"name\": \"workspace_diff\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"patch receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"rolled_back\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"write\",\n \"worktree\",\n \"patch\",\n \"session\"\n ],\n \"blocks_on_conflict\": true,\n \"requires_clean_worktree\": true,\n \"requires_confirmation\": true,\n \"requires_evidence_before_trigger\": true,\n \"risk_band\": \"high\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"partial\",\n \"supports_rollback\": true\n },\n \"summary\": \"Apply a validated patch bundle to the workspace.\",\n \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nIn a long-running harness loop, decide how apply_patch_bundle behaves under planner, validator, and runtime constraints.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 0}} |
| {"mode": "runtime_session", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=runtime_session\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"patch artifact ref\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"artifact_ref\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"boolean\",\n \"default_value\": false,\n \"description\": \"dry run flag\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"dry_run\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 4000,\n \"token_cost_estimate\": 64,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"patch\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": false,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": true,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": true,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"write\",\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": true,\n \"supports_resume\": true\n },\n \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n \"invocation_mode\": \"mutating\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\",\n \"sandbox_rollback_bridge\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"workspace diff\",\n \"evidence_backwrite\": false,\n \"kind\": \"patch\",\n \"name\": \"workspace_diff\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"patch receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"rolled_back\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"write\",\n \"worktree\",\n \"patch\",\n \"session\"\n ],\n \"blocks_on_conflict\": true,\n \"requires_clean_worktree\": true,\n \"requires_confirmation\": true,\n \"requires_evidence_before_trigger\": true,\n \"risk_band\": \"high\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"partial\",\n \"supports_rollback\": true\n },\n \"summary\": \"Apply a validated patch bundle to the workspace.\",\n \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nState the runtime references that must remain continuous before and after apply_patch_bundle.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "runtime_session", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "runtime_session", "focus": "runtime_session", "split": "train", "variant_rank": 0}} |
| {"mode": "worktree_permission", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=worktree_permission\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"patch artifact ref\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"artifact_ref\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"boolean\",\n \"default_value\": false,\n \"description\": \"dry run flag\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"dry_run\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 4000,\n \"token_cost_estimate\": 64,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"patch\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": false,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": true,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": true,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"write\",\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": true,\n \"supports_resume\": true\n },\n \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n \"invocation_mode\": \"mutating\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\",\n \"sandbox_rollback_bridge\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"workspace diff\",\n \"evidence_backwrite\": false,\n \"kind\": \"patch\",\n \"name\": \"workspace_diff\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"patch receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"rolled_back\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"write\",\n \"worktree\",\n \"patch\",\n \"session\"\n ],\n \"blocks_on_conflict\": true,\n \"requires_clean_worktree\": true,\n \"requires_confirmation\": true,\n \"requires_evidence_before_trigger\": true,\n \"risk_band\": \"high\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"partial\",\n \"supports_rollback\": true\n },\n \"summary\": \"Apply a validated patch bundle to the workspace.\",\n \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nExplain how apply_patch_bundle must obey worktree and permission boundaries.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "worktree_permission", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "worktree_permission", "focus": "worktree_permission", "split": "train", "variant_rank": 0}} |
| {"mode": "tool_trigger", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"patch artifact ref\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"artifact_ref\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"boolean\",\n \"default_value\": false,\n \"description\": \"dry run flag\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"dry_run\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 4000,\n \"token_cost_estimate\": 64,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"patch\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": false,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": true,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": true,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"write\",\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": true,\n \"supports_resume\": true\n },\n \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n \"invocation_mode\": \"mutating\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\",\n \"sandbox_rollback_bridge\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"workspace diff\",\n \"evidence_backwrite\": false,\n \"kind\": \"patch\",\n \"name\": \"workspace_diff\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"patch receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"rolled_back\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"write\",\n \"worktree\",\n \"patch\",\n \"session\"\n ],\n \"blocks_on_conflict\": true,\n \"requires_clean_worktree\": true,\n \"requires_confirmation\": true,\n \"requires_evidence_before_trigger\": true,\n \"risk_band\": \"high\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"partial\",\n \"supports_rollback\": true\n },\n \"summary\": \"Apply a validated patch bundle to the workspace.\",\n \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nChoose between apply_patch_bundle and run_ci_validation; trigger apply_patch_bundle only if its capability, not the competing tool, matches the bounded task.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 2}} |
| {"mode": "argument_shaping", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"patch artifact ref\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"artifact_ref\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"boolean\",\n \"default_value\": false,\n \"description\": \"dry run flag\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"dry_run\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 4000,\n \"token_cost_estimate\": 64,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"patch\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": false,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": true,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": true,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"write\",\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": true,\n \"supports_resume\": true\n },\n \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n \"invocation_mode\": \"mutating\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\",\n \"sandbox_rollback_bridge\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"workspace diff\",\n \"evidence_backwrite\": false,\n \"kind\": \"patch\",\n \"name\": \"workspace_diff\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"patch receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"rolled_back\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"write\",\n \"worktree\",\n \"patch\",\n \"session\"\n ],\n \"blocks_on_conflict\": true,\n \"requires_clean_worktree\": true,\n \"requires_confirmation\": true,\n \"requires_evidence_before_trigger\": true,\n \"risk_band\": \"high\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"partial\",\n \"supports_rollback\": true\n },\n \"summary\": \"Apply a validated patch bundle to the workspace.\",\n \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nShape the exact bounded payload for apply_patch_bundle so the runtime validator accepts it on the first pass.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 1}} |
| {"mode": "precondition_gating", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"patch artifact ref\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"artifact_ref\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"boolean\",\n \"default_value\": false,\n \"description\": \"dry run flag\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"dry_run\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 4000,\n \"token_cost_estimate\": 64,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"patch\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": false,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": true,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": true,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"write\",\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": true,\n \"supports_resume\": true\n },\n \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n \"invocation_mode\": \"mutating\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\",\n \"sandbox_rollback_bridge\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"workspace diff\",\n \"evidence_backwrite\": false,\n \"kind\": \"patch\",\n \"name\": \"workspace_diff\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"patch receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"rolled_back\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"write\",\n \"worktree\",\n \"patch\",\n \"session\"\n ],\n \"blocks_on_conflict\": true,\n \"requires_clean_worktree\": true,\n \"requires_confirmation\": true,\n \"requires_evidence_before_trigger\": true,\n \"risk_band\": \"high\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"partial\",\n \"supports_rollback\": true\n },\n \"summary\": \"Apply a validated patch bundle to the workspace.\",\n \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nA caller wants apply_patch_bundle immediately, yet the validator envelope shows missing prerequisites; choose the bounded next step.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 1}} |
| {"mode": "receipt_and_validation", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"patch artifact ref\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"artifact_ref\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"boolean\",\n \"default_value\": false,\n \"description\": \"dry run flag\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"dry_run\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 4000,\n \"token_cost_estimate\": 64,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"patch\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": false,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": true,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": true,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"write\",\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": true,\n \"supports_resume\": true\n },\n \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n \"invocation_mode\": \"mutating\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\",\n \"sandbox_rollback_bridge\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"workspace diff\",\n \"evidence_backwrite\": false,\n \"kind\": \"patch\",\n \"name\": \"workspace_diff\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"patch receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"rolled_back\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"write\",\n \"worktree\",\n \"patch\",\n \"session\"\n ],\n \"blocks_on_conflict\": true,\n \"requires_clean_worktree\": true,\n \"requires_confirmation\": true,\n \"requires_evidence_before_trigger\": true,\n \"risk_band\": \"high\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"partial\",\n \"supports_rollback\": true\n },\n \"summary\": \"Apply a validated patch bundle to the workspace.\",\n \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nEmit the receipt fields that prove apply_patch_bundle, not run_ci_validation, actually ran under the bounded validator policy.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 2}} |
| {"mode": "harness_envelope", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"patch artifact ref\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"artifact_ref\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": false\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"boolean\",\n \"default_value\": false,\n \"description\": \"dry run flag\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"dry_run\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 4000,\n \"token_cost_estimate\": 64,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"patch\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": false,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": true,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": true,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"write\",\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": true,\n \"supports_resume\": true\n },\n \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n \"invocation_mode\": \"mutating\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\",\n \"sandbox_rollback_bridge\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"workspace diff\",\n \"evidence_backwrite\": false,\n \"kind\": \"patch\",\n \"name\": \"workspace_diff\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"patch receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": true,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"rolled_back\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"write\",\n \"worktree\",\n \"patch\",\n \"session\"\n ],\n \"blocks_on_conflict\": true,\n \"requires_clean_worktree\": true,\n \"requires_confirmation\": true,\n \"requires_evidence_before_trigger\": true,\n \"risk_band\": \"high\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"partial\",\n \"supports_rollback\": true\n },\n \"summary\": \"Apply a validated patch bundle to the workspace.\",\n \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nTreat apply_patch_bundle as one step inside the full VeriLoop harness; describe the obedient bounded behavior rather than general coding ability.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 1}} |
| {"mode": "precondition_gating", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": \"pytest -q\",\n \"description\": \"test selector\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"test_selector\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 8000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Read-only validation tool under workspace / session discipline.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"execution_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"validate\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"worktree\",\n \"validate\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe user asks to run run_ci_validation but permissions, evidence, or worktree preconditions are incomplete.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 0}} |
| {"mode": "worktree_permission", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=worktree_permission\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": \"pytest -q\",\n \"description\": \"test selector\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"test_selector\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 8000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Read-only validation tool under workspace / session discipline.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"execution_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"validate\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"worktree\",\n \"validate\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nExplain how run_ci_validation must obey worktree and permission boundaries.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "worktree_permission", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "worktree_permission", "focus": "worktree_permission", "split": "train", "variant_rank": 0}} |
| {"mode": "tool_trigger", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": \"pytest -q\",\n \"description\": \"test selector\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"test_selector\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 8000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Read-only validation tool under workspace / session discipline.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"execution_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"validate\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"worktree\",\n \"validate\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nGiven the bounded runtime contract, decide whether run_ci_validation is the legal next action instead of narration.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 0}} |
| {"mode": "argument_shaping", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": \"pytest -q\",\n \"description\": \"test selector\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"test_selector\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 8000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Read-only validation tool under workspace / session discipline.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"execution_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"validate\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"worktree\",\n \"validate\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nProduce a contract-compliant argument object for run_ci_validation with typed fields only.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 0}} |
| {"mode": "precondition_gating", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": \"pytest -q\",\n \"description\": \"test selector\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"test_selector\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 8000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Read-only validation tool under workspace / session discipline.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"execution_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"validate\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"worktree\",\n \"validate\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nA caller wants run_ci_validation immediately, yet the validator envelope shows missing prerequisites; choose the bounded next step.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 1}} |
| {"mode": "receipt_and_validation", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": \"pytest -q\",\n \"description\": \"test selector\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"test_selector\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 8000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Read-only validation tool under workspace / session discipline.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"execution_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"validate\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"worktree\",\n \"validate\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nReturn the expected receipt and validator-facing structure for run_ci_validation.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 0}} |
| {"mode": "harness_envelope", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": \"pytest -q\",\n \"description\": \"test selector\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"test_selector\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 8000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Read-only validation tool under workspace / session discipline.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"execution_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"validate\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"worktree\",\n \"validate\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nIn a long-running harness loop, decide how run_ci_validation behaves under planner, validator, and runtime constraints.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 0}} |
| {"mode": "runtime_session", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=runtime_session\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": \"pytest -q\",\n \"description\": \"test selector\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"test_selector\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 8000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Read-only validation tool under workspace / session discipline.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"execution_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"validate\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"worktree\",\n \"validate\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nState the runtime references that must remain continuous before and after run_ci_validation.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "runtime_session", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "runtime_session", "focus": "runtime_session", "split": "train", "variant_rank": 0}} |
| {"mode": "worktree_permission", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=worktree_permission\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": \"pytest -q\",\n \"description\": \"test selector\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"test_selector\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 8000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Read-only validation tool under workspace / session discipline.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"execution_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"validate\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"worktree\",\n \"validate\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nConstrain run_ci_validation so it respects workspace hygiene, permission gating, and bounded mutation policy.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "worktree_permission", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "worktree_permission", "focus": "worktree_permission", "split": "train", "variant_rank": 1}} |
| {"mode": "tool_trigger", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": \"pytest -q\",\n \"description\": \"test selector\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"test_selector\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 8000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Read-only validation tool under workspace / session discipline.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"execution_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"validate\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"worktree\",\n \"validate\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe agent is tempted to answer directly; determine if run_ci_validation must be triggered under the typed envelope.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 1}} |
| {"mode": "argument_shaping", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": \"pytest -q\",\n \"description\": \"test selector\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"test_selector\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 8000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Read-only validation tool under workspace / session discipline.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"execution_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"validate\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"worktree\",\n \"validate\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nShape the exact bounded payload for run_ci_validation so the runtime validator accepts it on the first pass.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 1}} |
| {"mode": "precondition_gating", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": \"pytest -q\",\n \"description\": \"test selector\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"test_selector\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 8000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Read-only validation tool under workspace / session discipline.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"execution_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"validate\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"worktree\",\n \"validate\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nDo not let run_ci_validation or apply_patch_bundle fire when the required preconditions are still missing; defer or repair instead.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 2}} |
| {"mode": "receipt_and_validation", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": \"pytest -q\",\n \"description\": \"test selector\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"test_selector\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 8000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Read-only validation tool under workspace / session discipline.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"execution_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"validate\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"worktree\",\n \"validate\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nAfter run_ci_validation finishes, format the execution and validation receipts so the harness can audit them deterministically.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 1}} |
| {"mode": "harness_envelope", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"string\",\n \"default_value\": \"pytest -q\",\n \"description\": \"test selector\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"test_selector\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 8000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Read-only validation tool under workspace / session discipline.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"execution receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"execution_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"validate\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"worktree\",\n \"validate\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nTreat run_ci_validation as one step inside the full VeriLoop harness; describe the obedient bounded behavior rather than general coding ability.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 1}} |
| {"mode": "self_check_loop", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=self_check_loop\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to validate\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"entry_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 6000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"self_check_loop\": true,\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"bounded failure explanation\",\n \"evidence_backwrite\": false,\n \"kind\": \"text\",\n \"name\": \"failure_report\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"validate\",\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe model already wrote code; the harness now needs one bounded self-check-and-repair cycle before final submit.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "self_check_loop", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "self_check_loop", "focus": "self_check_loop", "split": "train", "variant_rank": 0}} |
| {"mode": "tool_trigger", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to validate\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"entry_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 6000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"self_check_loop\": true,\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"bounded failure explanation\",\n \"evidence_backwrite\": false,\n \"kind\": \"text\",\n \"name\": \"failure_report\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"validate\",\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nGiven the bounded runtime contract, decide whether self_check_repair_loop is the legal next action instead of narration.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 0}} |
| {"mode": "argument_shaping", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to validate\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"entry_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 6000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"self_check_loop\": true,\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"bounded failure explanation\",\n \"evidence_backwrite\": false,\n \"kind\": \"text\",\n \"name\": \"failure_report\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"validate\",\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nProduce a contract-compliant argument object for self_check_repair_loop with typed fields only.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 0}} |
| {"mode": "precondition_gating", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to validate\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"entry_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 6000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"self_check_loop\": true,\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"bounded failure explanation\",\n \"evidence_backwrite\": false,\n \"kind\": \"text\",\n \"name\": \"failure_report\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"validate\",\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe user asks to run self_check_repair_loop but permissions, evidence, or worktree preconditions are incomplete.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 0}} |
| {"mode": "receipt_and_validation", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to validate\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"entry_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 6000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"self_check_loop\": true,\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"bounded failure explanation\",\n \"evidence_backwrite\": false,\n \"kind\": \"text\",\n \"name\": \"failure_report\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"validate\",\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nReturn the expected receipt and validator-facing structure for self_check_repair_loop.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 0}} |
| {"mode": "harness_envelope", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to validate\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"entry_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 6000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"self_check_loop\": true,\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"bounded failure explanation\",\n \"evidence_backwrite\": false,\n \"kind\": \"text\",\n \"name\": \"failure_report\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"validate\",\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nIn a long-running harness loop, decide how self_check_repair_loop behaves under planner, validator, and runtime constraints.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 0}} |
| {"mode": "runtime_session", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=runtime_session\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to validate\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"entry_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 6000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"self_check_loop\": true,\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"bounded failure explanation\",\n \"evidence_backwrite\": false,\n \"kind\": \"text\",\n \"name\": \"failure_report\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"validate\",\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nState the runtime references that must remain continuous before and after self_check_repair_loop.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "runtime_session", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "runtime_session", "focus": "runtime_session", "split": "train", "variant_rank": 0}} |
| {"mode": "worktree_permission", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=worktree_permission\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to validate\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"entry_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 6000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"self_check_loop\": true,\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"bounded failure explanation\",\n \"evidence_backwrite\": false,\n \"kind\": \"text\",\n \"name\": \"failure_report\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"validate\",\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nExplain how self_check_repair_loop must obey worktree and permission boundaries.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "worktree_permission", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "worktree_permission", "focus": "worktree_permission", "split": "train", "variant_rank": 0}} |
| {"mode": "self_check_loop", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=self_check_loop\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to validate\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"entry_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 6000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"self_check_loop\": true,\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"bounded failure explanation\",\n \"evidence_backwrite\": false,\n \"kind\": \"text\",\n \"name\": \"failure_report\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"validate\",\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nA candidate patch exists; decide how the self-check loop should validate, diagnose, and route the next bounded repair step.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "self_check_loop", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "self_check_loop", "focus": "self_check_loop", "split": "train", "variant_rank": 1}} |
| {"mode": "tool_trigger", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to validate\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"entry_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 6000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"self_check_loop\": true,\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"bounded failure explanation\",\n \"evidence_backwrite\": false,\n \"kind\": \"text\",\n \"name\": \"failure_report\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"validate\",\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe agent is tempted to answer directly; determine if self_check_repair_loop must be triggered under the typed envelope.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 1}} |
| {"mode": "argument_shaping", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to validate\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"entry_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 6000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"self_check_loop\": true,\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"bounded failure explanation\",\n \"evidence_backwrite\": false,\n \"kind\": \"text\",\n \"name\": \"failure_report\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"validate\",\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nShape the exact bounded payload for self_check_repair_loop so the runtime validator accepts it on the first pass.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 1}} |
| {"mode": "precondition_gating", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to validate\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"entry_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 6000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"self_check_loop\": true,\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"bounded failure explanation\",\n \"evidence_backwrite\": false,\n \"kind\": \"text\",\n \"name\": \"failure_report\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"validate\",\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nA caller wants self_check_repair_loop immediately, yet the validator envelope shows missing prerequisites; choose the bounded next step.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 1}} |
| {"mode": "receipt_and_validation", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to validate\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"entry_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 6000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"self_check_loop\": true,\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"bounded failure explanation\",\n \"evidence_backwrite\": false,\n \"kind\": \"text\",\n \"name\": \"failure_report\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"validate\",\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nAfter self_check_repair_loop finishes, format the execution and validation receipts so the harness can audit them deterministically.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 1}} |
| {"mode": "harness_envelope", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to validate\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"entry_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 6000,\n \"token_cost_estimate\": 96,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"validator\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": false,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": true,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"execute\",\n \"validate\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n \"invocation_mode\": \"executing\",\n \"metadata\": {\n \"self_check_loop\": true,\n \"validator_names\": [\n \"sandbox_result_validator\"\n ]\n },\n \"outputs\": [\n {\n \"description\": \"validator receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"validation_receipt\",\n \"name\": \"validator_receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n },\n {\n \"description\": \"bounded failure explanation\",\n \"evidence_backwrite\": false,\n \"kind\": \"text\",\n \"name\": \"failure_report\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"repair\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"execute\",\n \"validate\",\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"medium\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nTreat self_check_repair_loop as one step inside the full VeriLoop harness; describe the obedient bounded behavior rather than general coding ability.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 1}} |
| {"mode": "reverse_engineering", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=reverse_engineering\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to inspect\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"focus_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 3500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": false,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"reverse_engineering\": true\n },\n \"outputs\": [\n {\n \"description\": \"bounded repository map\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"repo_map\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"inspection receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"low\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nRepository purpose is unclear; infer architecture, contracts, and dependencies through bounded reverse engineering.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "reverse_engineering", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "reverse_engineering", "focus": "reverse_engineering", "split": "train", "variant_rank": 0}} |
| {"mode": "runtime_session", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=runtime_session\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to inspect\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"focus_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 3500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": false,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"reverse_engineering\": true\n },\n \"outputs\": [\n {\n \"description\": \"bounded repository map\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"repo_map\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"inspection receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"low\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nState the runtime references that must remain continuous before and after repo_reverse_engineer.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "runtime_session", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "runtime_session", "focus": "runtime_session", "split": "train", "variant_rank": 0}} |
| {"mode": "tool_trigger", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to inspect\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"focus_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 3500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": false,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"reverse_engineering\": true\n },\n \"outputs\": [\n {\n \"description\": \"bounded repository map\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"repo_map\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"inspection receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"low\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nGiven the bounded runtime contract, decide whether repo_reverse_engineer is the legal next action instead of narration.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 0}} |
| {"mode": "argument_shaping", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to inspect\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"focus_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 3500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": false,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"reverse_engineering\": true\n },\n \"outputs\": [\n {\n \"description\": \"bounded repository map\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"repo_map\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"inspection receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"low\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nProduce a contract-compliant argument object for repo_reverse_engineer with typed fields only.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 0}} |
| {"mode": "precondition_gating", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to inspect\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"focus_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 3500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": false,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"reverse_engineering\": true\n },\n \"outputs\": [\n {\n \"description\": \"bounded repository map\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"repo_map\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"inspection receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"low\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe user asks to run repo_reverse_engineer but permissions, evidence, or worktree preconditions are incomplete.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 0}} |
| {"mode": "receipt_and_validation", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to inspect\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"focus_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 3500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": false,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"reverse_engineering\": true\n },\n \"outputs\": [\n {\n \"description\": \"bounded repository map\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"repo_map\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"inspection receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"low\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nReturn the expected receipt and validator-facing structure for repo_reverse_engineer.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 0}} |
| {"mode": "harness_envelope", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to inspect\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"focus_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 3500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": false,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"reverse_engineering\": true\n },\n \"outputs\": [\n {\n \"description\": \"bounded repository map\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"repo_map\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"inspection receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"low\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nIn a long-running harness loop, decide how repo_reverse_engineer behaves under planner, validator, and runtime constraints.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 0}} |
| {"mode": "runtime_session", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=runtime_session\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to inspect\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"focus_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 3500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": false,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"reverse_engineering\": true\n },\n \"outputs\": [\n {\n \"description\": \"bounded repository map\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"repo_map\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"inspection receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"low\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nExplain which session identifiers, receipts, and bounded state packets must survive across a call to repo_reverse_engineer.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "runtime_session", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "runtime_session", "focus": "runtime_session", "split": "train", "variant_rank": 1}} |
| {"mode": "worktree_permission", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=worktree_permission\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to inspect\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"focus_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 3500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": false,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"reverse_engineering\": true\n },\n \"outputs\": [\n {\n \"description\": \"bounded repository map\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"repo_map\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"inspection receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"low\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nExplain how repo_reverse_engineer must obey worktree and permission boundaries.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "worktree_permission", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "worktree_permission", "focus": "worktree_permission", "split": "train", "variant_rank": 0}} |
| {"mode": "reverse_engineering", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=reverse_engineering\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to inspect\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"focus_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 3500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": false,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"reverse_engineering\": true\n },\n \"outputs\": [\n {\n \"description\": \"bounded repository map\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"repo_map\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"inspection receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"low\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe harness sees an unfamiliar codebase; recover module roles and dependency structure with repository inspection instead of guessing.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "reverse_engineering", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "reverse_engineering", "focus": "reverse_engineering", "split": "train", "variant_rank": 1}} |
| {"mode": "tool_trigger", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to inspect\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"focus_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 3500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": false,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"reverse_engineering\": true\n },\n \"outputs\": [\n {\n \"description\": \"bounded repository map\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"repo_map\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"inspection receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"low\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe agent is tempted to answer directly; determine if repo_reverse_engineer must be triggered under the typed envelope.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 1}} |
| {"mode": "argument_shaping", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to inspect\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"focus_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 3500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": false,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"reverse_engineering\": true\n },\n \"outputs\": [\n {\n \"description\": \"bounded repository map\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"repo_map\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"inspection receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"low\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nShape the exact bounded payload for repo_reverse_engineer so the runtime validator accepts it on the first pass.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 1}} |
| {"mode": "precondition_gating", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to inspect\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"focus_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 3500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": false,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"reverse_engineering\": true\n },\n \"outputs\": [\n {\n \"description\": \"bounded repository map\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"repo_map\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"inspection receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"low\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nA caller wants repo_reverse_engineer immediately, yet the validator envelope shows missing prerequisites; choose the bounded next step.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 1}} |
| {"mode": "receipt_and_validation", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n \"arguments\": [\n {\n \"arg_type\": \"string\",\n \"default_value\": null,\n \"description\": \"workspace root\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"workspace_root\",\n \"nullable\": false,\n \"path_like\": true,\n \"repeated\": false,\n \"required\": true,\n \"sensitive\": false,\n \"workspace_scoped\": true\n },\n {\n \"arg_type\": \"array\",\n \"default_value\": [],\n \"description\": \"paths to inspect\",\n \"enum_values\": [],\n \"examples\": [],\n \"location\": \"body\",\n \"name\": \"focus_paths\",\n \"nullable\": false,\n \"path_like\": false,\n \"repeated\": false,\n \"required\": false,\n \"sensitive\": false,\n \"workspace_scoped\": false\n }\n ],\n \"budget_hint\": {\n \"network_cost_estimate\": 0,\n \"sandbox_cost_estimate\": 1,\n \"step_cost_estimate\": 1,\n \"time_cost_estimate_ms\": 3500,\n \"token_cost_estimate\": 128,\n \"tool_call_cost_estimate\": 1\n },\n \"capability\": \"search\",\n \"constraints\": {\n \"allowed_isolation_modes\": [],\n \"allowed_path_prefixes\": [],\n \"approval_modes\": [],\n \"auto_mode_allowed\": true,\n \"emits_evidence_ids\": true,\n \"emits_patch_ref\": false,\n \"emits_receipt\": true,\n \"emits_validation_receipt\": false,\n \"forbidden_path_prefixes\": [],\n \"mutates_workspace\": false,\n \"plan_mode_allowed\": true,\n \"required_permissions\": [\n \"worktree\"\n ],\n \"required_task_statuses\": [],\n \"requires_worktree\": true,\n \"supports_compact_boundary\": false,\n \"supports_resume\": true\n },\n \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n \"invocation_mode\": \"read_only\",\n \"metadata\": {\n \"reverse_engineering\": true\n },\n \"outputs\": [\n {\n \"description\": \"bounded repository map\",\n \"evidence_backwrite\": true,\n \"kind\": \"evidence\",\n \"name\": \"repo_map\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": false\n },\n {\n \"description\": \"inspection receipt\",\n \"evidence_backwrite\": false,\n \"kind\": \"execution_receipt\",\n \"name\": \"receipt\",\n \"patch_relevant\": false,\n \"reproducible\": true,\n \"required\": true,\n \"task_output_relevant\": false,\n \"validator_relevant\": true\n }\n ],\n \"phase\": \"execute\",\n \"receipt_policy\": {\n \"include_artifact_refs\": true,\n \"include_budget_charge\": true,\n \"include_evidence_ids\": true,\n \"include_patch_refs\": true,\n \"include_permission_decision\": true,\n \"include_raw_value\": false,\n \"include_task_output_refs\": true,\n \"include_validator_refs\": true,\n \"include_worktree_ref\": true,\n \"receipt_statuses\": [\n \"succeeded\",\n \"failed\",\n \"blocked\"\n ]\n },\n \"risk_profile\": {\n \"allowed_permissions\": [\n \"worktree\",\n \"session\"\n ],\n \"blocks_on_conflict\": false,\n \"requires_clean_worktree\": false,\n \"requires_confirmation\": false,\n \"requires_evidence_before_trigger\": false,\n \"risk_band\": \"low\",\n \"sensitive_domains\": [\n \"workspace\"\n ],\n \"side_effect_level\": \"none\",\n \"supports_rollback\": false\n },\n \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nAfter repo_reverse_engineer finishes, format the execution and validation receipts so the harness can audit them deterministically.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 1}} |
|
|