File size: 375,718 Bytes
98746ed
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
{"mode": "argument_shaping", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"search query\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"query\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"integer\",\n      \"default_value\": 5,\n      \"description\": \"maximum hits\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"top_k\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 1,\n    \"sandbox_cost_estimate\": 0,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 2500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"network\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": false,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Search tool under runtime/network/validator discipline.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"retrieved evidence bundle\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"results\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"search execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"network\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"open_web\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Search public web sources and return evidence candidates.\",\n  \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nProduce a contract-compliant argument object for browser_search with typed fields only.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 0}}
{"mode": "harness_envelope", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"search query\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"query\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"integer\",\n      \"default_value\": 5,\n      \"description\": \"maximum hits\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"top_k\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 1,\n    \"sandbox_cost_estimate\": 0,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 2500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"network\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": false,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Search tool under runtime/network/validator discipline.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"retrieved evidence bundle\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"results\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"search execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"network\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"open_web\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Search public web sources and return evidence candidates.\",\n  \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nIn a long-running harness loop, decide how browser_search behaves under planner, validator, and runtime constraints.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 0}}
{"mode": "tool_trigger", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"search query\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"query\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"integer\",\n      \"default_value\": 5,\n      \"description\": \"maximum hits\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"top_k\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 1,\n    \"sandbox_cost_estimate\": 0,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 2500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"network\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": false,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Search tool under runtime/network/validator discipline.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"retrieved evidence bundle\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"results\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"search execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"network\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"open_web\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Search public web sources and return evidence candidates.\",\n  \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nGiven the bounded runtime contract, decide whether browser_search is the legal next action instead of narration.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 0}}
{"mode": "argument_shaping", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"search query\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"query\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"integer\",\n      \"default_value\": 5,\n      \"description\": \"maximum hits\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"top_k\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 1,\n    \"sandbox_cost_estimate\": 0,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 2500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"network\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": false,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Search tool under runtime/network/validator discipline.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"retrieved evidence bundle\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"results\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"search execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"network\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"open_web\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Search public web sources and return evidence candidates.\",\n  \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nShape the exact bounded payload for browser_search so the runtime validator accepts it on the first pass.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 1}}
{"mode": "precondition_gating", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"search query\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"query\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"integer\",\n      \"default_value\": 5,\n      \"description\": \"maximum hits\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"top_k\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 1,\n    \"sandbox_cost_estimate\": 0,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 2500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"network\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": false,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Search tool under runtime/network/validator discipline.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"retrieved evidence bundle\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"results\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"search execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"network\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"open_web\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Search public web sources and return evidence candidates.\",\n  \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe user asks to run browser_search but permissions, evidence, or worktree preconditions are incomplete.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 0}}
{"mode": "receipt_and_validation", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"search query\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"query\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"integer\",\n      \"default_value\": 5,\n      \"description\": \"maximum hits\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"top_k\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 1,\n    \"sandbox_cost_estimate\": 0,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 2500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"network\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": false,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Search tool under runtime/network/validator discipline.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"retrieved evidence bundle\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"results\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"search execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"network\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"open_web\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Search public web sources and return evidence candidates.\",\n  \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nReturn the expected receipt and validator-facing structure for browser_search.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 0}}
{"mode": "harness_envelope", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"search query\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"query\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"integer\",\n      \"default_value\": 5,\n      \"description\": \"maximum hits\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"top_k\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 1,\n    \"sandbox_cost_estimate\": 0,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 2500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"network\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": false,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Search tool under runtime/network/validator discipline.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"retrieved evidence bundle\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"results\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"search execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"network\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"open_web\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Search public web sources and return evidence candidates.\",\n  \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nTreat browser_search as one step inside the full VeriLoop harness; describe the obedient bounded behavior rather than general coding ability.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 1}}
{"mode": "runtime_session", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=runtime_session\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"search query\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"query\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"integer\",\n      \"default_value\": 5,\n      \"description\": \"maximum hits\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"top_k\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 1,\n    \"sandbox_cost_estimate\": 0,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 2500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"network\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": false,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Search tool under runtime/network/validator discipline.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"retrieved evidence bundle\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"results\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"search execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"network\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"open_web\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Search public web sources and return evidence candidates.\",\n  \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nState the runtime references that must remain continuous before and after browser_search.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "runtime_session", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "runtime_session", "focus": "runtime_session", "split": "train", "variant_rank": 0}}
{"mode": "worktree_permission", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=worktree_permission\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"search query\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"query\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"integer\",\n      \"default_value\": 5,\n      \"description\": \"maximum hits\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"top_k\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 1,\n    \"sandbox_cost_estimate\": 0,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 2500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"network\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": false,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Search tool under runtime/network/validator discipline.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"retrieved evidence bundle\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"results\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"search execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"network\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"open_web\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Search public web sources and return evidence candidates.\",\n  \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nExplain how browser_search must obey worktree and permission boundaries.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "worktree_permission", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "worktree_permission", "focus": "worktree_permission", "split": "train", "variant_rank": 0}}
{"mode": "tool_trigger", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"search query\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"query\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"integer\",\n      \"default_value\": 5,\n      \"description\": \"maximum hits\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"top_k\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 1,\n    \"sandbox_cost_estimate\": 0,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 2500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"network\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": false,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Search tool under runtime/network/validator discipline.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"retrieved evidence bundle\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"results\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"search execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"network\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"open_web\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Search public web sources and return evidence candidates.\",\n  \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe agent is tempted to answer directly; determine if browser_search must be triggered under the typed envelope.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 1}}
{"mode": "argument_shaping", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"search query\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"query\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"integer\",\n      \"default_value\": 5,\n      \"description\": \"maximum hits\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"top_k\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 1,\n    \"sandbox_cost_estimate\": 0,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 2500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"network\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": false,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Search tool under runtime/network/validator discipline.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"retrieved evidence bundle\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"results\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"search execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"network\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"open_web\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Search public web sources and return evidence candidates.\",\n  \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nDo not shape arguments as if this were repo_reverse_engineer; normalize the request into the strict schema for browser_search only.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 2}}
{"mode": "precondition_gating", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"search query\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"query\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"integer\",\n      \"default_value\": 5,\n      \"description\": \"maximum hits\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"top_k\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 1,\n    \"sandbox_cost_estimate\": 0,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 2500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"network\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": false,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Search tool under runtime/network/validator discipline.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"retrieved evidence bundle\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"results\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"search execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"network\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"open_web\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Search public web sources and return evidence candidates.\",\n  \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nA caller wants browser_search immediately, yet the validator envelope shows missing prerequisites; choose the bounded next step.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 1}}
{"mode": "receipt_and_validation", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"search query\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"query\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"integer\",\n      \"default_value\": 5,\n      \"description\": \"maximum hits\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"top_k\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 1,\n    \"sandbox_cost_estimate\": 0,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 2500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"network\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": false,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Search tool under runtime/network/validator discipline.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"retrieved evidence bundle\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"results\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"search execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"network\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"open_web\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Search public web sources and return evidence candidates.\",\n  \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nAfter browser_search finishes, format the execution and validation receipts so the harness can audit them deterministically.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 1}}
{"mode": "harness_envelope", "tool_name": "browser_search", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"search query\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"query\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"integer\",\n      \"default_value\": 5,\n      \"description\": \"maximum hits\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"top_k\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 1,\n    \"sandbox_cost_estimate\": 0,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 2500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"network\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": false,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Search tool under runtime/network/validator discipline.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"retrieved evidence bundle\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"results\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"search execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"network\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"open_web\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Search public web sources and return evidence candidates.\",\n  \"tool_name\": \"browser_search\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nUnder control-plane priority, explain why browser_search is the bounded move here while run_ci_validation stays subordinate or unused.\n[/USER_QUERY]", "labels": {"tool_name": "browser_search", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 0, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0]}, "metadata": {"tool_name": "browser_search", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 2}}
{"mode": "tool_trigger", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"patch artifact ref\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"artifact_ref\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"boolean\",\n      \"default_value\": false,\n      \"description\": \"dry run flag\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"dry_run\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 4000,\n    \"token_cost_estimate\": 64,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"patch\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": false,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": true,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": true,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"write\",\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": true,\n    \"supports_resume\": true\n  },\n  \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n  \"invocation_mode\": \"mutating\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\",\n      \"sandbox_rollback_bridge\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"workspace diff\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"patch\",\n      \"name\": \"workspace_diff\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"patch receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"rolled_back\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"write\",\n      \"worktree\",\n      \"patch\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": true,\n    \"requires_clean_worktree\": true,\n    \"requires_confirmation\": true,\n    \"requires_evidence_before_trigger\": true,\n    \"risk_band\": \"high\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"partial\",\n    \"supports_rollback\": true\n  },\n  \"summary\": \"Apply a validated patch bundle to the workspace.\",\n  \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nGiven the bounded runtime contract, decide whether apply_patch_bundle is the legal next action instead of narration.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 0}}
{"mode": "receipt_and_validation", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"patch artifact ref\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"artifact_ref\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"boolean\",\n      \"default_value\": false,\n      \"description\": \"dry run flag\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"dry_run\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 4000,\n    \"token_cost_estimate\": 64,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"patch\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": false,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": true,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": true,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"write\",\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": true,\n    \"supports_resume\": true\n  },\n  \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n  \"invocation_mode\": \"mutating\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\",\n      \"sandbox_rollback_bridge\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"workspace diff\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"patch\",\n      \"name\": \"workspace_diff\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"patch receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"rolled_back\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"write\",\n      \"worktree\",\n      \"patch\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": true,\n    \"requires_clean_worktree\": true,\n    \"requires_confirmation\": true,\n    \"requires_evidence_before_trigger\": true,\n    \"risk_band\": \"high\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"partial\",\n    \"supports_rollback\": true\n  },\n  \"summary\": \"Apply a validated patch bundle to the workspace.\",\n  \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nReturn the expected receipt and validator-facing structure for apply_patch_bundle.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 0}}
{"mode": "tool_trigger", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"patch artifact ref\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"artifact_ref\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"boolean\",\n      \"default_value\": false,\n      \"description\": \"dry run flag\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"dry_run\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 4000,\n    \"token_cost_estimate\": 64,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"patch\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": false,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": true,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": true,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"write\",\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": true,\n    \"supports_resume\": true\n  },\n  \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n  \"invocation_mode\": \"mutating\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\",\n      \"sandbox_rollback_bridge\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"workspace diff\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"patch\",\n      \"name\": \"workspace_diff\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"patch receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"rolled_back\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"write\",\n      \"worktree\",\n      \"patch\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": true,\n    \"requires_clean_worktree\": true,\n    \"requires_confirmation\": true,\n    \"requires_evidence_before_trigger\": true,\n    \"risk_band\": \"high\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"partial\",\n    \"supports_rollback\": true\n  },\n  \"summary\": \"Apply a validated patch bundle to the workspace.\",\n  \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe agent is tempted to answer directly; determine if apply_patch_bundle must be triggered under the typed envelope.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 1}}
{"mode": "argument_shaping", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"patch artifact ref\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"artifact_ref\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"boolean\",\n      \"default_value\": false,\n      \"description\": \"dry run flag\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"dry_run\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 4000,\n    \"token_cost_estimate\": 64,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"patch\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": false,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": true,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": true,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"write\",\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": true,\n    \"supports_resume\": true\n  },\n  \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n  \"invocation_mode\": \"mutating\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\",\n      \"sandbox_rollback_bridge\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"workspace diff\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"patch\",\n      \"name\": \"workspace_diff\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"patch receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"rolled_back\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"write\",\n      \"worktree\",\n      \"patch\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": true,\n    \"requires_clean_worktree\": true,\n    \"requires_confirmation\": true,\n    \"requires_evidence_before_trigger\": true,\n    \"risk_band\": \"high\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"partial\",\n    \"supports_rollback\": true\n  },\n  \"summary\": \"Apply a validated patch bundle to the workspace.\",\n  \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nProduce a contract-compliant argument object for apply_patch_bundle with typed fields only.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 0}}
{"mode": "precondition_gating", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"patch artifact ref\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"artifact_ref\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"boolean\",\n      \"default_value\": false,\n      \"description\": \"dry run flag\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"dry_run\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 4000,\n    \"token_cost_estimate\": 64,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"patch\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": false,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": true,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": true,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"write\",\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": true,\n    \"supports_resume\": true\n  },\n  \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n  \"invocation_mode\": \"mutating\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\",\n      \"sandbox_rollback_bridge\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"workspace diff\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"patch\",\n      \"name\": \"workspace_diff\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"patch receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"rolled_back\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"write\",\n      \"worktree\",\n      \"patch\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": true,\n    \"requires_clean_worktree\": true,\n    \"requires_confirmation\": true,\n    \"requires_evidence_before_trigger\": true,\n    \"risk_band\": \"high\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"partial\",\n    \"supports_rollback\": true\n  },\n  \"summary\": \"Apply a validated patch bundle to the workspace.\",\n  \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe user asks to run apply_patch_bundle but permissions, evidence, or worktree preconditions are incomplete.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 0}}
{"mode": "receipt_and_validation", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"patch artifact ref\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"artifact_ref\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"boolean\",\n      \"default_value\": false,\n      \"description\": \"dry run flag\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"dry_run\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 4000,\n    \"token_cost_estimate\": 64,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"patch\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": false,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": true,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": true,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"write\",\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": true,\n    \"supports_resume\": true\n  },\n  \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n  \"invocation_mode\": \"mutating\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\",\n      \"sandbox_rollback_bridge\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"workspace diff\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"patch\",\n      \"name\": \"workspace_diff\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"patch receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"rolled_back\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"write\",\n      \"worktree\",\n      \"patch\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": true,\n    \"requires_clean_worktree\": true,\n    \"requires_confirmation\": true,\n    \"requires_evidence_before_trigger\": true,\n    \"risk_band\": \"high\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"partial\",\n    \"supports_rollback\": true\n  },\n  \"summary\": \"Apply a validated patch bundle to the workspace.\",\n  \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nAfter apply_patch_bundle finishes, format the execution and validation receipts so the harness can audit them deterministically.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 1}}
{"mode": "harness_envelope", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"patch artifact ref\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"artifact_ref\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"boolean\",\n      \"default_value\": false,\n      \"description\": \"dry run flag\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"dry_run\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 4000,\n    \"token_cost_estimate\": 64,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"patch\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": false,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": true,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": true,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"write\",\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": true,\n    \"supports_resume\": true\n  },\n  \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n  \"invocation_mode\": \"mutating\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\",\n      \"sandbox_rollback_bridge\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"workspace diff\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"patch\",\n      \"name\": \"workspace_diff\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"patch receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"rolled_back\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"write\",\n      \"worktree\",\n      \"patch\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": true,\n    \"requires_clean_worktree\": true,\n    \"requires_confirmation\": true,\n    \"requires_evidence_before_trigger\": true,\n    \"risk_band\": \"high\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"partial\",\n    \"supports_rollback\": true\n  },\n  \"summary\": \"Apply a validated patch bundle to the workspace.\",\n  \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nIn a long-running harness loop, decide how apply_patch_bundle behaves under planner, validator, and runtime constraints.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 0}}
{"mode": "runtime_session", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=runtime_session\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"patch artifact ref\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"artifact_ref\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"boolean\",\n      \"default_value\": false,\n      \"description\": \"dry run flag\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"dry_run\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 4000,\n    \"token_cost_estimate\": 64,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"patch\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": false,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": true,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": true,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"write\",\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": true,\n    \"supports_resume\": true\n  },\n  \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n  \"invocation_mode\": \"mutating\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\",\n      \"sandbox_rollback_bridge\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"workspace diff\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"patch\",\n      \"name\": \"workspace_diff\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"patch receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"rolled_back\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"write\",\n      \"worktree\",\n      \"patch\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": true,\n    \"requires_clean_worktree\": true,\n    \"requires_confirmation\": true,\n    \"requires_evidence_before_trigger\": true,\n    \"risk_band\": \"high\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"partial\",\n    \"supports_rollback\": true\n  },\n  \"summary\": \"Apply a validated patch bundle to the workspace.\",\n  \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nState the runtime references that must remain continuous before and after apply_patch_bundle.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "runtime_session", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "runtime_session", "focus": "runtime_session", "split": "train", "variant_rank": 0}}
{"mode": "worktree_permission", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=worktree_permission\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"patch artifact ref\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"artifact_ref\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"boolean\",\n      \"default_value\": false,\n      \"description\": \"dry run flag\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"dry_run\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 4000,\n    \"token_cost_estimate\": 64,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"patch\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": false,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": true,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": true,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"write\",\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": true,\n    \"supports_resume\": true\n  },\n  \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n  \"invocation_mode\": \"mutating\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\",\n      \"sandbox_rollback_bridge\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"workspace diff\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"patch\",\n      \"name\": \"workspace_diff\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"patch receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"rolled_back\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"write\",\n      \"worktree\",\n      \"patch\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": true,\n    \"requires_clean_worktree\": true,\n    \"requires_confirmation\": true,\n    \"requires_evidence_before_trigger\": true,\n    \"risk_band\": \"high\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"partial\",\n    \"supports_rollback\": true\n  },\n  \"summary\": \"Apply a validated patch bundle to the workspace.\",\n  \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nExplain how apply_patch_bundle must obey worktree and permission boundaries.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "worktree_permission", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "worktree_permission", "focus": "worktree_permission", "split": "train", "variant_rank": 0}}
{"mode": "tool_trigger", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"patch artifact ref\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"artifact_ref\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"boolean\",\n      \"default_value\": false,\n      \"description\": \"dry run flag\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"dry_run\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 4000,\n    \"token_cost_estimate\": 64,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"patch\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": false,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": true,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": true,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"write\",\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": true,\n    \"supports_resume\": true\n  },\n  \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n  \"invocation_mode\": \"mutating\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\",\n      \"sandbox_rollback_bridge\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"workspace diff\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"patch\",\n      \"name\": \"workspace_diff\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"patch receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"rolled_back\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"write\",\n      \"worktree\",\n      \"patch\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": true,\n    \"requires_clean_worktree\": true,\n    \"requires_confirmation\": true,\n    \"requires_evidence_before_trigger\": true,\n    \"risk_band\": \"high\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"partial\",\n    \"supports_rollback\": true\n  },\n  \"summary\": \"Apply a validated patch bundle to the workspace.\",\n  \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nChoose between apply_patch_bundle and run_ci_validation; trigger apply_patch_bundle only if its capability, not the competing tool, matches the bounded task.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 2}}
{"mode": "argument_shaping", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"patch artifact ref\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"artifact_ref\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"boolean\",\n      \"default_value\": false,\n      \"description\": \"dry run flag\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"dry_run\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 4000,\n    \"token_cost_estimate\": 64,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"patch\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": false,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": true,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": true,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"write\",\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": true,\n    \"supports_resume\": true\n  },\n  \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n  \"invocation_mode\": \"mutating\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\",\n      \"sandbox_rollback_bridge\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"workspace diff\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"patch\",\n      \"name\": \"workspace_diff\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"patch receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"rolled_back\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"write\",\n      \"worktree\",\n      \"patch\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": true,\n    \"requires_clean_worktree\": true,\n    \"requires_confirmation\": true,\n    \"requires_evidence_before_trigger\": true,\n    \"risk_band\": \"high\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"partial\",\n    \"supports_rollback\": true\n  },\n  \"summary\": \"Apply a validated patch bundle to the workspace.\",\n  \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nShape the exact bounded payload for apply_patch_bundle so the runtime validator accepts it on the first pass.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 1}}
{"mode": "precondition_gating", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"patch artifact ref\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"artifact_ref\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"boolean\",\n      \"default_value\": false,\n      \"description\": \"dry run flag\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"dry_run\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 4000,\n    \"token_cost_estimate\": 64,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"patch\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": false,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": true,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": true,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"write\",\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": true,\n    \"supports_resume\": true\n  },\n  \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n  \"invocation_mode\": \"mutating\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\",\n      \"sandbox_rollback_bridge\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"workspace diff\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"patch\",\n      \"name\": \"workspace_diff\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"patch receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"rolled_back\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"write\",\n      \"worktree\",\n      \"patch\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": true,\n    \"requires_clean_worktree\": true,\n    \"requires_confirmation\": true,\n    \"requires_evidence_before_trigger\": true,\n    \"risk_band\": \"high\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"partial\",\n    \"supports_rollback\": true\n  },\n  \"summary\": \"Apply a validated patch bundle to the workspace.\",\n  \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nA caller wants apply_patch_bundle immediately, yet the validator envelope shows missing prerequisites; choose the bounded next step.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 1}}
{"mode": "receipt_and_validation", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"patch artifact ref\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"artifact_ref\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"boolean\",\n      \"default_value\": false,\n      \"description\": \"dry run flag\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"dry_run\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 4000,\n    \"token_cost_estimate\": 64,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"patch\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": false,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": true,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": true,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"write\",\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": true,\n    \"supports_resume\": true\n  },\n  \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n  \"invocation_mode\": \"mutating\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\",\n      \"sandbox_rollback_bridge\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"workspace diff\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"patch\",\n      \"name\": \"workspace_diff\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"patch receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"rolled_back\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"write\",\n      \"worktree\",\n      \"patch\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": true,\n    \"requires_clean_worktree\": true,\n    \"requires_confirmation\": true,\n    \"requires_evidence_before_trigger\": true,\n    \"risk_band\": \"high\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"partial\",\n    \"supports_rollback\": true\n  },\n  \"summary\": \"Apply a validated patch bundle to the workspace.\",\n  \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nEmit the receipt fields that prove apply_patch_bundle, not run_ci_validation, actually ran under the bounded validator policy.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 2}}
{"mode": "harness_envelope", "tool_name": "apply_patch_bundle", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"patch artifact ref\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"artifact_ref\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"boolean\",\n      \"default_value\": false,\n      \"description\": \"dry run flag\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"dry_run\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 4000,\n    \"token_cost_estimate\": 64,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"patch\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": false,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": true,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": true,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"write\",\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": true,\n    \"supports_resume\": true\n  },\n  \"description\": \"Mutating patch tool under worktree / snapshot / validator discipline.\",\n  \"invocation_mode\": \"mutating\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\",\n      \"sandbox_rollback_bridge\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"workspace diff\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"patch\",\n      \"name\": \"workspace_diff\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"patch receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": true,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"rolled_back\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"write\",\n      \"worktree\",\n      \"patch\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": true,\n    \"requires_clean_worktree\": true,\n    \"requires_confirmation\": true,\n    \"requires_evidence_before_trigger\": true,\n    \"risk_band\": \"high\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"partial\",\n    \"supports_rollback\": true\n  },\n  \"summary\": \"Apply a validated patch bundle to the workspace.\",\n  \"tool_name\": \"apply_patch_bundle\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nTreat apply_patch_bundle as one step inside the full VeriLoop harness; describe the obedient bounded behavior rather than general coding ability.\n[/USER_QUERY]", "labels": {"tool_name": "apply_patch_bundle", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 1, "confirmation_required": 1, "session_required": 1, "permission_bits": [0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1]}, "metadata": {"tool_name": "apply_patch_bundle", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 1}}
{"mode": "precondition_gating", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": \"pytest -q\",\n      \"description\": \"test selector\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"test_selector\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 8000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Read-only validation tool under workspace / session discipline.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"execution_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"validate\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"worktree\",\n      \"validate\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n  \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe user asks to run run_ci_validation but permissions, evidence, or worktree preconditions are incomplete.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 0}}
{"mode": "worktree_permission", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=worktree_permission\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": \"pytest -q\",\n      \"description\": \"test selector\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"test_selector\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 8000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Read-only validation tool under workspace / session discipline.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"execution_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"validate\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"worktree\",\n      \"validate\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n  \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nExplain how run_ci_validation must obey worktree and permission boundaries.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "worktree_permission", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "worktree_permission", "focus": "worktree_permission", "split": "train", "variant_rank": 0}}
{"mode": "tool_trigger", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": \"pytest -q\",\n      \"description\": \"test selector\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"test_selector\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 8000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Read-only validation tool under workspace / session discipline.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"execution_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"validate\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"worktree\",\n      \"validate\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n  \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nGiven the bounded runtime contract, decide whether run_ci_validation is the legal next action instead of narration.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 0}}
{"mode": "argument_shaping", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": \"pytest -q\",\n      \"description\": \"test selector\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"test_selector\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 8000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Read-only validation tool under workspace / session discipline.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"execution_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"validate\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"worktree\",\n      \"validate\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n  \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nProduce a contract-compliant argument object for run_ci_validation with typed fields only.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 0}}
{"mode": "precondition_gating", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": \"pytest -q\",\n      \"description\": \"test selector\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"test_selector\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 8000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Read-only validation tool under workspace / session discipline.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"execution_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"validate\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"worktree\",\n      \"validate\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n  \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nA caller wants run_ci_validation immediately, yet the validator envelope shows missing prerequisites; choose the bounded next step.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 1}}
{"mode": "receipt_and_validation", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": \"pytest -q\",\n      \"description\": \"test selector\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"test_selector\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 8000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Read-only validation tool under workspace / session discipline.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"execution_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"validate\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"worktree\",\n      \"validate\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n  \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nReturn the expected receipt and validator-facing structure for run_ci_validation.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 0}}
{"mode": "harness_envelope", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": \"pytest -q\",\n      \"description\": \"test selector\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"test_selector\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 8000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Read-only validation tool under workspace / session discipline.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"execution_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"validate\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"worktree\",\n      \"validate\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n  \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nIn a long-running harness loop, decide how run_ci_validation behaves under planner, validator, and runtime constraints.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 0}}
{"mode": "runtime_session", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=runtime_session\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": \"pytest -q\",\n      \"description\": \"test selector\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"test_selector\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 8000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Read-only validation tool under workspace / session discipline.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"execution_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"validate\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"worktree\",\n      \"validate\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n  \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nState the runtime references that must remain continuous before and after run_ci_validation.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "runtime_session", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "runtime_session", "focus": "runtime_session", "split": "train", "variant_rank": 0}}
{"mode": "worktree_permission", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=worktree_permission\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": \"pytest -q\",\n      \"description\": \"test selector\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"test_selector\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 8000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Read-only validation tool under workspace / session discipline.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"execution_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"validate\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"worktree\",\n      \"validate\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n  \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nConstrain run_ci_validation so it respects workspace hygiene, permission gating, and bounded mutation policy.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "worktree_permission", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "worktree_permission", "focus": "worktree_permission", "split": "train", "variant_rank": 1}}
{"mode": "tool_trigger", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": \"pytest -q\",\n      \"description\": \"test selector\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"test_selector\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 8000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Read-only validation tool under workspace / session discipline.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"execution_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"validate\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"worktree\",\n      \"validate\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n  \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe agent is tempted to answer directly; determine if run_ci_validation must be triggered under the typed envelope.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 1}}
{"mode": "argument_shaping", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": \"pytest -q\",\n      \"description\": \"test selector\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"test_selector\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 8000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Read-only validation tool under workspace / session discipline.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"execution_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"validate\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"worktree\",\n      \"validate\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n  \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nShape the exact bounded payload for run_ci_validation so the runtime validator accepts it on the first pass.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 1}}
{"mode": "precondition_gating", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": \"pytest -q\",\n      \"description\": \"test selector\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"test_selector\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 8000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Read-only validation tool under workspace / session discipline.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"execution_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"validate\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"worktree\",\n      \"validate\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n  \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nDo not let run_ci_validation or apply_patch_bundle fire when the required preconditions are still missing; defer or repair instead.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 2}}
{"mode": "receipt_and_validation", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": \"pytest -q\",\n      \"description\": \"test selector\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"test_selector\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 8000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Read-only validation tool under workspace / session discipline.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"execution_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"validate\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"worktree\",\n      \"validate\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n  \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nAfter run_ci_validation finishes, format the execution and validation receipts so the harness can audit them deterministically.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 1}}
{"mode": "harness_envelope", "tool_name": "run_ci_validation", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": \"pytest -q\",\n      \"description\": \"test selector\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"test_selector\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 8000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Read-only validation tool under workspace / session discipline.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"execution receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"execution_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"validate\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"worktree\",\n      \"validate\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded CI/test validation and emit validator-compatible receipts.\",\n  \"tool_name\": \"run_ci_validation\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nTreat run_ci_validation as one step inside the full VeriLoop harness; describe the obedient bounded behavior rather than general coding ability.\n[/USER_QUERY]", "labels": {"tool_name": "run_ci_validation", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "run_ci_validation", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 1}}
{"mode": "self_check_loop", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=self_check_loop\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to validate\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"entry_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 6000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"self_check_loop\": true,\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"bounded failure explanation\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"text\",\n      \"name\": \"failure_report\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"validate\",\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n  \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe model already wrote code; the harness now needs one bounded self-check-and-repair cycle before final submit.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "self_check_loop", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "self_check_loop", "focus": "self_check_loop", "split": "train", "variant_rank": 0}}
{"mode": "tool_trigger", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to validate\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"entry_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 6000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"self_check_loop\": true,\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"bounded failure explanation\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"text\",\n      \"name\": \"failure_report\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"validate\",\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n  \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nGiven the bounded runtime contract, decide whether self_check_repair_loop is the legal next action instead of narration.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 0}}
{"mode": "argument_shaping", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to validate\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"entry_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 6000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"self_check_loop\": true,\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"bounded failure explanation\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"text\",\n      \"name\": \"failure_report\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"validate\",\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n  \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nProduce a contract-compliant argument object for self_check_repair_loop with typed fields only.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 0}}
{"mode": "precondition_gating", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to validate\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"entry_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 6000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"self_check_loop\": true,\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"bounded failure explanation\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"text\",\n      \"name\": \"failure_report\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"validate\",\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n  \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe user asks to run self_check_repair_loop but permissions, evidence, or worktree preconditions are incomplete.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 0}}
{"mode": "receipt_and_validation", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to validate\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"entry_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 6000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"self_check_loop\": true,\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"bounded failure explanation\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"text\",\n      \"name\": \"failure_report\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"validate\",\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n  \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nReturn the expected receipt and validator-facing structure for self_check_repair_loop.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 0}}
{"mode": "harness_envelope", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to validate\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"entry_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 6000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"self_check_loop\": true,\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"bounded failure explanation\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"text\",\n      \"name\": \"failure_report\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"validate\",\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n  \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nIn a long-running harness loop, decide how self_check_repair_loop behaves under planner, validator, and runtime constraints.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 0}}
{"mode": "runtime_session", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=runtime_session\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to validate\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"entry_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 6000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"self_check_loop\": true,\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"bounded failure explanation\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"text\",\n      \"name\": \"failure_report\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"validate\",\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n  \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nState the runtime references that must remain continuous before and after self_check_repair_loop.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "runtime_session", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "runtime_session", "focus": "runtime_session", "split": "train", "variant_rank": 0}}
{"mode": "worktree_permission", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=worktree_permission\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to validate\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"entry_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 6000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"self_check_loop\": true,\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"bounded failure explanation\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"text\",\n      \"name\": \"failure_report\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"validate\",\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n  \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nExplain how self_check_repair_loop must obey worktree and permission boundaries.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "worktree_permission", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "worktree_permission", "focus": "worktree_permission", "split": "train", "variant_rank": 0}}
{"mode": "self_check_loop", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=self_check_loop\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to validate\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"entry_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 6000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"self_check_loop\": true,\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"bounded failure explanation\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"text\",\n      \"name\": \"failure_report\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"validate\",\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n  \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nA candidate patch exists; decide how the self-check loop should validate, diagnose, and route the next bounded repair step.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "self_check_loop", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "self_check_loop", "focus": "self_check_loop", "split": "train", "variant_rank": 1}}
{"mode": "tool_trigger", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to validate\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"entry_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 6000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"self_check_loop\": true,\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"bounded failure explanation\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"text\",\n      \"name\": \"failure_report\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"validate\",\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n  \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe agent is tempted to answer directly; determine if self_check_repair_loop must be triggered under the typed envelope.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 1}}
{"mode": "argument_shaping", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to validate\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"entry_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 6000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"self_check_loop\": true,\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"bounded failure explanation\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"text\",\n      \"name\": \"failure_report\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"validate\",\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n  \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nShape the exact bounded payload for self_check_repair_loop so the runtime validator accepts it on the first pass.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 1}}
{"mode": "precondition_gating", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to validate\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"entry_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 6000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"self_check_loop\": true,\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"bounded failure explanation\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"text\",\n      \"name\": \"failure_report\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"validate\",\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n  \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nA caller wants self_check_repair_loop immediately, yet the validator envelope shows missing prerequisites; choose the bounded next step.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 1}}
{"mode": "receipt_and_validation", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to validate\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"entry_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 6000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"self_check_loop\": true,\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"bounded failure explanation\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"text\",\n      \"name\": \"failure_report\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"validate\",\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n  \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nAfter self_check_repair_loop finishes, format the execution and validation receipts so the harness can audit them deterministically.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 1}}
{"mode": "harness_envelope", "tool_name": "self_check_repair_loop", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to validate\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"entry_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 6000,\n    \"token_cost_estimate\": 96,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"validator\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": false,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": true,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"execute\",\n      \"validate\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Self-check loop tool for code-after-generation verification and bounded repair routing.\",\n  \"invocation_mode\": \"executing\",\n  \"metadata\": {\n    \"self_check_loop\": true,\n    \"validator_names\": [\n      \"sandbox_result_validator\"\n    ]\n  },\n  \"outputs\": [\n    {\n      \"description\": \"validator receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"validation_receipt\",\n      \"name\": \"validator_receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    },\n    {\n      \"description\": \"bounded failure explanation\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"text\",\n      \"name\": \"failure_report\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"repair\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"execute\",\n      \"validate\",\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"medium\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Run bounded self-check, diagnose the failed constraint, and prepare the next repair step.\",\n  \"tool_name\": \"self_check_repair_loop\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nTreat self_check_repair_loop as one step inside the full VeriLoop harness; describe the obedient bounded behavior rather than general coding ability.\n[/USER_QUERY]", "labels": {"tool_name": "self_check_repair_loop", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 1, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0]}, "metadata": {"tool_name": "self_check_repair_loop", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 1}}
{"mode": "reverse_engineering", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=reverse_engineering\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to inspect\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"focus_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 3500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": false,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"reverse_engineering\": true\n  },\n  \"outputs\": [\n    {\n      \"description\": \"bounded repository map\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"repo_map\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"inspection receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"low\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n  \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nRepository purpose is unclear; infer architecture, contracts, and dependencies through bounded reverse engineering.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "reverse_engineering", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "reverse_engineering", "focus": "reverse_engineering", "split": "train", "variant_rank": 0}}
{"mode": "runtime_session", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=runtime_session\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to inspect\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"focus_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 3500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": false,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"reverse_engineering\": true\n  },\n  \"outputs\": [\n    {\n      \"description\": \"bounded repository map\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"repo_map\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"inspection receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"low\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n  \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nState the runtime references that must remain continuous before and after repo_reverse_engineer.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "runtime_session", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "runtime_session", "focus": "runtime_session", "split": "train", "variant_rank": 0}}
{"mode": "tool_trigger", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to inspect\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"focus_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 3500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": false,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"reverse_engineering\": true\n  },\n  \"outputs\": [\n    {\n      \"description\": \"bounded repository map\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"repo_map\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"inspection receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"low\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n  \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nGiven the bounded runtime contract, decide whether repo_reverse_engineer is the legal next action instead of narration.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 0}}
{"mode": "argument_shaping", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to inspect\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"focus_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 3500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": false,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"reverse_engineering\": true\n  },\n  \"outputs\": [\n    {\n      \"description\": \"bounded repository map\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"repo_map\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"inspection receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"low\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n  \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nProduce a contract-compliant argument object for repo_reverse_engineer with typed fields only.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 0}}
{"mode": "precondition_gating", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to inspect\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"focus_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 3500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": false,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"reverse_engineering\": true\n  },\n  \"outputs\": [\n    {\n      \"description\": \"bounded repository map\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"repo_map\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"inspection receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"low\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n  \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe user asks to run repo_reverse_engineer but permissions, evidence, or worktree preconditions are incomplete.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 0}}
{"mode": "receipt_and_validation", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to inspect\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"focus_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 3500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": false,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"reverse_engineering\": true\n  },\n  \"outputs\": [\n    {\n      \"description\": \"bounded repository map\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"repo_map\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"inspection receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"low\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n  \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nReturn the expected receipt and validator-facing structure for repo_reverse_engineer.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 0}}
{"mode": "harness_envelope", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=harness_envelope\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to inspect\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"focus_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 3500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": false,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"reverse_engineering\": true\n  },\n  \"outputs\": [\n    {\n      \"description\": \"bounded repository map\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"repo_map\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"inspection receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"low\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n  \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nIn a long-running harness loop, decide how repo_reverse_engineer behaves under planner, validator, and runtime constraints.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "harness_envelope", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "harness_envelope", "focus": "harness_envelope", "split": "train", "variant_rank": 0}}
{"mode": "runtime_session", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=runtime_session\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to inspect\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"focus_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 3500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": false,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"reverse_engineering\": true\n  },\n  \"outputs\": [\n    {\n      \"description\": \"bounded repository map\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"repo_map\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"inspection receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"low\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n  \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nExplain which session identifiers, receipts, and bounded state packets must survive across a call to repo_reverse_engineer.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "runtime_session", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "runtime_session", "focus": "runtime_session", "split": "train", "variant_rank": 1}}
{"mode": "worktree_permission", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=worktree_permission\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to inspect\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"focus_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 3500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": false,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"reverse_engineering\": true\n  },\n  \"outputs\": [\n    {\n      \"description\": \"bounded repository map\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"repo_map\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"inspection receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"low\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n  \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nExplain how repo_reverse_engineer must obey worktree and permission boundaries.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "worktree_permission", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "worktree_permission", "focus": "worktree_permission", "split": "train", "variant_rank": 0}}
{"mode": "reverse_engineering", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=reverse_engineering\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to inspect\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"focus_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 3500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": false,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"reverse_engineering\": true\n  },\n  \"outputs\": [\n    {\n      \"description\": \"bounded repository map\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"repo_map\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"inspection receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"low\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n  \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe harness sees an unfamiliar codebase; recover module roles and dependency structure with repository inspection instead of guessing.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "reverse_engineering", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "reverse_engineering", "focus": "reverse_engineering", "split": "train", "variant_rank": 1}}
{"mode": "tool_trigger", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=trigger\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to inspect\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"focus_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 3500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": false,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"reverse_engineering\": true\n  },\n  \"outputs\": [\n    {\n      \"description\": \"bounded repository map\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"repo_map\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"inspection receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"low\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n  \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nThe agent is tempted to answer directly; determine if repo_reverse_engineer must be triggered under the typed envelope.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "tool_trigger", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "tool_trigger", "focus": "trigger", "split": "train", "variant_rank": 1}}
{"mode": "argument_shaping", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=arguments\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to inspect\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"focus_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 3500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": false,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"reverse_engineering\": true\n  },\n  \"outputs\": [\n    {\n      \"description\": \"bounded repository map\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"repo_map\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"inspection receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"low\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n  \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nShape the exact bounded payload for repo_reverse_engineer so the runtime validator accepts it on the first pass.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "argument_shaping", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "argument_shaping", "focus": "arguments", "split": "train", "variant_rank": 1}}
{"mode": "precondition_gating", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=precondition_gating\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to inspect\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"focus_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 3500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": false,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"reverse_engineering\": true\n  },\n  \"outputs\": [\n    {\n      \"description\": \"bounded repository map\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"repo_map\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"inspection receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"low\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n  \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nA caller wants repo_reverse_engineer immediately, yet the validator envelope shows missing prerequisites; choose the bounded next step.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "precondition_gating", "trigger": 0, "schema_ok": 0, "precondition_ok": 0, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "precondition_gating", "focus": "precondition_gating", "split": "train", "variant_rank": 1}}
{"mode": "receipt_and_validation", "tool_name": "repo_reverse_engineer", "user_query": "[HARNESS_ENVELOPE]\nrole=generator\nruntime_protocol=true\ntyped_tool_contracts=true\nvalidator_alignment=true\nsession_continuity=true\npermission_alignment=true\nworktree_discipline=true\nrepair_after_self_check=true\nreverse_engineering_ready=true\nrule=Do not emit free-form tool fantasies. Follow the typed tool contract exactly.\nrule=If preconditions are not satisfied, defer, repair, or ask for the next bounded step.\nrule=Validator receipts and runtime permissions outrank narration.\nrule=If code is produced, the harness may still call a bounded self-check loop before final submit.\nrule=When repository intent is unclear, reverse-engineering and repository inspection are valid bounded actions.\ncontract_focus=receipt_validation\n[/HARNESS_ENVELOPE]\n\n[TOOL_SPEC]\n{\n  \"arguments\": [\n    {\n      \"arg_type\": \"string\",\n      \"default_value\": null,\n      \"description\": \"workspace root\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"workspace_root\",\n      \"nullable\": false,\n      \"path_like\": true,\n      \"repeated\": false,\n      \"required\": true,\n      \"sensitive\": false,\n      \"workspace_scoped\": true\n    },\n    {\n      \"arg_type\": \"array\",\n      \"default_value\": [],\n      \"description\": \"paths to inspect\",\n      \"enum_values\": [],\n      \"examples\": [],\n      \"location\": \"body\",\n      \"name\": \"focus_paths\",\n      \"nullable\": false,\n      \"path_like\": false,\n      \"repeated\": false,\n      \"required\": false,\n      \"sensitive\": false,\n      \"workspace_scoped\": false\n    }\n  ],\n  \"budget_hint\": {\n    \"network_cost_estimate\": 0,\n    \"sandbox_cost_estimate\": 1,\n    \"step_cost_estimate\": 1,\n    \"time_cost_estimate_ms\": 3500,\n    \"token_cost_estimate\": 128,\n    \"tool_call_cost_estimate\": 1\n  },\n  \"capability\": \"search\",\n  \"constraints\": {\n    \"allowed_isolation_modes\": [],\n    \"allowed_path_prefixes\": [],\n    \"approval_modes\": [],\n    \"auto_mode_allowed\": true,\n    \"emits_evidence_ids\": true,\n    \"emits_patch_ref\": false,\n    \"emits_receipt\": true,\n    \"emits_validation_receipt\": false,\n    \"forbidden_path_prefixes\": [],\n    \"mutates_workspace\": false,\n    \"plan_mode_allowed\": true,\n    \"required_permissions\": [\n      \"worktree\"\n    ],\n    \"required_task_statuses\": [],\n    \"requires_worktree\": true,\n    \"supports_compact_boundary\": false,\n    \"supports_resume\": true\n  },\n  \"description\": \"Repository reverse-engineering tool for code understanding, dependency tracing, and intent recovery.\",\n  \"invocation_mode\": \"read_only\",\n  \"metadata\": {\n    \"reverse_engineering\": true\n  },\n  \"outputs\": [\n    {\n      \"description\": \"bounded repository map\",\n      \"evidence_backwrite\": true,\n      \"kind\": \"evidence\",\n      \"name\": \"repo_map\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": false\n    },\n    {\n      \"description\": \"inspection receipt\",\n      \"evidence_backwrite\": false,\n      \"kind\": \"execution_receipt\",\n      \"name\": \"receipt\",\n      \"patch_relevant\": false,\n      \"reproducible\": true,\n      \"required\": true,\n      \"task_output_relevant\": false,\n      \"validator_relevant\": true\n    }\n  ],\n  \"phase\": \"execute\",\n  \"receipt_policy\": {\n    \"include_artifact_refs\": true,\n    \"include_budget_charge\": true,\n    \"include_evidence_ids\": true,\n    \"include_patch_refs\": true,\n    \"include_permission_decision\": true,\n    \"include_raw_value\": false,\n    \"include_task_output_refs\": true,\n    \"include_validator_refs\": true,\n    \"include_worktree_ref\": true,\n    \"receipt_statuses\": [\n      \"succeeded\",\n      \"failed\",\n      \"blocked\"\n    ]\n  },\n  \"risk_profile\": {\n    \"allowed_permissions\": [\n      \"worktree\",\n      \"session\"\n    ],\n    \"blocks_on_conflict\": false,\n    \"requires_clean_worktree\": false,\n    \"requires_confirmation\": false,\n    \"requires_evidence_before_trigger\": false,\n    \"risk_band\": \"low\",\n    \"sensitive_domains\": [\n      \"workspace\"\n    ],\n    \"side_effect_level\": \"none\",\n    \"supports_rollback\": false\n  },\n  \"summary\": \"Inspect repository structure, infer missing intent, and reconstruct bounded architecture facts.\",\n  \"tool_name\": \"repo_reverse_engineer\"\n}\n[/TOOL_SPEC]\n\n[USER_QUERY]\nAfter repo_reverse_engineer finishes, format the execution and validation receipts so the harness can audit them deterministically.\n[/USER_QUERY]", "labels": {"tool_name": "repo_reverse_engineer", "mode_name": "receipt_and_validation", "trigger": 1, "schema_ok": 1, "precondition_ok": 1, "validator_required": 0, "worktree_required": 1, "rollback_supported": 0, "confirmation_required": 0, "session_required": 1, "permission_bits": [0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0]}, "metadata": {"tool_name": "repo_reverse_engineer", "mode": "receipt_and_validation", "focus": "receipt_validation", "split": "train", "variant_rank": 1}}