ConorWang committed on
Commit
05bba4d
·
verified ·
1 Parent(s): f78e79b

Delete toolspec_adapter_train_result.json

Browse files
Files changed (1) hide show
  1. toolspec_adapter_train_result.json +0 -299
toolspec_adapter_train_result.json DELETED
@@ -1,299 +0,0 @@
1
- {
2
- "artifacts": {
3
- "adapter_dir": "/private/wang_libo/veriloop_coder_e1/outputs/toolspec_qwen36_rootfix_run1/adapter",
4
- "best_checkpoint_manifest": "/private/wang_libo/veriloop_coder_e1/outputs/toolspec_qwen36_rootfix_run1/best_checkpoint_manifest.json",
5
- "epoch_history": "/private/wang_libo/veriloop_coder_e1/outputs/toolspec_qwen36_rootfix_run1/epoch_history.json",
6
- "eval_jsonl": "/private/wang_libo/veriloop_coder_e1/outputs/toolspec_qwen36_rootfix_run1/toolspec_eval.jsonl",
7
- "host_manifest": "/private/wang_libo/veriloop_coder_e1/outputs/toolspec_qwen36_rootfix_run1/host_manifest.json",
8
- "plan_json": "/private/wang_libo/veriloop_coder_e1/outputs/toolspec_qwen36_rootfix_run1/toolspec_adapter_plan.json",
9
- "probe_head": "/private/wang_libo/veriloop_coder_e1/outputs/toolspec_qwen36_rootfix_run1/toolspec_probe_head.pt",
10
- "tokenizer_dir": "/private/wang_libo/veriloop_coder_e1/outputs/toolspec_qwen36_rootfix_run1/tokenizer",
11
- "train_jsonl": "/private/wang_libo/veriloop_coder_e1/outputs/toolspec_qwen36_rootfix_run1/toolspec_train.jsonl",
12
- "training_manifest": "/private/wang_libo/veriloop_coder_e1/outputs/toolspec_qwen36_rootfix_run1/toolspec_training_manifest.json"
13
- },
14
- "dataset": {
15
- "eval_size": 25,
16
- "modes": [
17
- "argument_shaping",
18
- "harness_envelope",
19
- "precondition_gating",
20
- "receipt_and_validation",
21
- "reverse_engineering",
22
- "runtime_session",
23
- "self_check_loop",
24
- "tool_trigger",
25
- "worktree_permission"
26
- ],
27
- "tools": [
28
- "apply_patch_bundle",
29
- "browser_search",
30
- "repo_reverse_engineer",
31
- "run_ci_validation",
32
- "self_check_repair_loop"
33
- ],
34
- "train_size": 70
35
- },
36
- "eval_metrics": {
37
- "adapter_exported": true,
38
- "auto_lora_from_ia3": false,
39
- "avg_binary_accuracy": 0.81,
40
- "best_epoch": 4,
41
- "best_quality_score": 0.46349615617231893,
42
- "confirmation_required_accuracy": 0.8,
43
- "count": 25,
44
- "eval_batches": 25,
45
- "eval_loss": 6.897225952148437,
46
- "mode_accuracy": 0.56,
47
- "peft_method": "lora_narrow",
48
- "permission_bit_accuracy": 0.8545454545454545,
49
- "precondition_ok_accuracy": 0.76,
50
- "quality_score": 0.46349615617231893,
51
- "rollback_supported_accuracy": 0.8,
52
- "schema_ok_accuracy": 0.76,
53
- "session_required_accuracy": 1.0,
54
- "tool_accuracy": 0.44,
55
- "trigger_accuracy": 0.76,
56
- "used_peft": true,
57
- "validator_required_accuracy": 0.8,
58
- "worktree_required_accuracy": 0.8
59
- },
60
- "plan": {
61
- "backbone": "/public/wang_libo/veriloop_coder_e1/model",
62
- "dataset_summary": {
63
- "eval_size": 25,
64
- "modes": [
65
- "argument_shaping",
66
- "harness_envelope",
67
- "precondition_gating",
68
- "receipt_and_validation",
69
- "reverse_engineering",
70
- "runtime_session",
71
- "self_check_loop",
72
- "tool_trigger",
73
- "worktree_permission"
74
- ],
75
- "tools": [
76
- "apply_patch_bundle",
77
- "browser_search",
78
- "repo_reverse_engineer",
79
- "run_ci_validation",
80
- "self_check_repair_loop"
81
- ],
82
- "train_size": 70
83
- },
84
- "excluded_surfaces": [
85
- "(^|\\.)lm_head($|\\.)::Do not retune final token head; too broad and evaluation-heavy.",
86
- "(^|\\.)embed_tokens($|\\.)::Embedding surgery risks broad semantic drift.",
87
- "(^|\\.)norm($|\\.)::Global norm tuning can destabilize calibration across scenes.",
88
- "attnres|attention_residual::Block AttnRes may be mounted structurally but is never a PEFT target.",
89
- "dualpath::DualPath is serving/runtime infrastructure only.",
90
- "mhc|hyper[-_]?connection::mHC-inspired stability hooks remain structural, not PEFT surfaces.",
91
- "rope|rotary::RoPE/context surgery is handled architecturally, not by narrow PEFT here.",
92
- "kvcache|kv_cache::KV-cache runtime surfaces are not PEFT targets.",
93
- "(^|\\.)memory(_store|_bank)?($|\\.)::Persistent memory stores are harness/runtime policy surfaces, not PEFT targets."
94
- ],
95
- "notes": [
96
- "Primary route is host-surface-first toolspec probe training, not broad coding SFT.",
97
- "This adapter is allowed to shape runtime protocol obedience, validator alignment, self-check willingness, and reverse-engineering readiness.",
98
- "Backbone attention, MoE router/expert weights, DualPath, Block AttnRes, and mHC remain excluded.",
99
- "Explicit host/runtime bridge leaves default to LoRA-narrow attachment because IA3 feedforward constraints do not fit this custom side-car surface design."
100
- ],
101
- "peft_method": "lora_narrow",
102
- "product_line": "veriloop_coder",
103
- "recipe": {
104
- "adapter_family": "runtime_harness",
105
- "backbone": "/public/wang_libo/veriloop_coder_e1/model",
106
- "backbone_family": "qwen_dense",
107
- "excluded_patterns": [
108
- "(?i)\\bdualpath\\b",
109
- "(?i)\\bmhc\\b",
110
- "(?i)\\bfull[_\\- ]?attnres\\b",
111
- "(?i)\\battnres(_full)?\\b",
112
- "(?i)\\brouter\\b",
113
- "(?i)\\bexperts?\\b",
114
- "(?i)\\bmoe\\b.*\\b(gate|router|expert)\\b",
115
- "(?i)\\brope\\b.*\\b(freq|inv_freq|theta|rotary)\\b",
116
- "(?i)\\bkvcache\\b",
117
- "(?i)\\bposition_embedding\\b",
118
- "(?i)\\bembed(tokens|ding)?\\b",
119
- "(?i)\\blm_head\\b"
120
- ],
121
- "harness_constraints": [
122
- "Harness Engineering remains the primary convergence layer.",
123
- "Adapter must not bypass runtime orchestrator / validator / rollback loops.",
124
- "Adapter outputs remain subordinate to VeriLoop control-plane decisions.",
125
- "Adapter must not create hidden prompt-style memory authority.",
126
- "Adapter must improve runtime protocol obedience, not free-form style drift.",
127
- "Tool legality, permission discipline, session continuity, and worktree hygiene must remain first-class."
128
- ],
129
- "hyperparams": {
130
- "alpha": 0,
131
- "bias": "none",
132
- "dropout": 0.0,
133
- "fan_in_fan_out": false,
134
- "modules_to_save": [],
135
- "r": 0,
136
- "task_type": "CAUSAL_LM"
137
- },
138
- "merge_policy": "side_load",
139
- "metadata": {
140
- "allow_backbone_bridge": false,
141
- "allow_vla_action_expert": false,
142
- "harness_first": true,
143
- "prefer_explicit_heads": true,
144
- "prefer_qlora_for_backbone_bridge": true,
145
- "require_harness_first": true,
146
- "selector_group_count": 2,
147
- "strict_narrow_scope": true,
148
- "toolspec_probe_training": true,
149
- "trainer": "veriloop.toolspec_adapter_trainer.v5.qwen36"
150
- },
151
- "notes": [
152
- "Harness Engineering is primary; PEFT is limited to obedience-facing, interface-facing support surfaces.",
153
- "Backbone bridge tuning disabled explicitly; selector stays on custom surfaces or no-op.",
154
- "Backbone family inferred as qwen_dense.",
155
- "PEFT method resolved as ia3_head_only.",
156
- "Recipe is harness-first: runtime convergence remains in VeriLoop control-plane + harness, not in broad weight surgery.",
157
- "Block AttnRes, DualPath, mHC hooks, RoPE, KV-cache, and broad MoE routing remain structurally excluded."
158
- ],
159
- "peft_method": "lora_narrow",
160
- "precision_policy": "auto",
161
- "product_line": "veriloop_coder",
162
- "regression_requirements": [
163
- "Must pass PEFT regression guard structural policy checks.",
164
- "Must not introduce forbidden backbone/serving structural targets.",
165
- "Must preserve harness regression envelope for the selected product line.",
166
- "Runtime protocol obedience must improve or hold.",
167
- "Tool trigger accuracy, permission discipline, and worktree continuity must not regress."
168
- ],
169
- "target_groups": [
170
- {
171
- "alpha": 16,
172
- "dropout": 0.05,
173
- "name": "group_1_custom_runtime_harness_bridge",
174
- "rank": 8,
175
- "rationale": "Runtime / harness obedience should attach to explicit interface bridges before any backbone fallback.",
176
- "surface": "custom_runtime_harness_bridge",
177
- "target_modules": [
178
- "failure_signal_bridge.rollback_bridge",
179
- "request_normalizer",
180
- "request_normalizer.adapter",
181
- "rollback_adapter",
182
- "rollback_adapter.head",
183
- "runtime_harness_adapter",
184
- "runtime_harness_adapter.bridge",
185
- "tool_protocol_adapter",
186
- "tool_protocol_adapter.bridge",
187
- "toolspec_bridge",
188
- "toolspec_bridge.adapter",
189
- "toolspec_head",
190
- "toolspec_head.param_schema_adapter",
191
- "toolspec_head.postcondition_adapter",
192
- "toolspec_head.precondition_adapter",
193
- "toolspec_head.receipt_formatter",
194
- "toolspec_head.trigger_gate",
195
- "toolspec_head.validator_gate",
196
- "validator_feedback_loop.rollback_adapter"
197
- ]
198
- },
199
- {
200
- "alpha": 8,
201
- "dropout": 0.0,
202
- "name": "group_2_custom_memory_boundary_bridge",
203
- "rank": 4,
204
- "rationale": "Session continuity should bind to boundary-aware memory packet surfaces rather than broad backbone tuning.",
205
- "surface": "custom_memory_boundary_bridge",
206
- "target_modules": [
207
- "episodic_memory",
208
- "episodic_memory.adapter",
209
- "memory_boundary_guard",
210
- "memory_boundary_guard.adapter",
211
- "memory_boundary_guard.rollback_filter",
212
- "session_compactor",
213
- "session_compactor.adapter"
214
- ]
215
- }
216
- ],
217
- "target_modules": [
218
- "failure_signal_bridge.rollback_bridge",
219
- "request_normalizer",
220
- "request_normalizer.adapter",
221
- "rollback_adapter",
222
- "rollback_adapter.head",
223
- "runtime_harness_adapter",
224
- "runtime_harness_adapter.bridge",
225
- "tool_protocol_adapter",
226
- "tool_protocol_adapter.bridge",
227
- "toolspec_bridge",
228
- "toolspec_bridge.adapter",
229
- "toolspec_head",
230
- "toolspec_head.param_schema_adapter",
231
- "toolspec_head.postcondition_adapter",
232
- "toolspec_head.precondition_adapter",
233
- "toolspec_head.receipt_formatter",
234
- "toolspec_head.trigger_gate",
235
- "toolspec_head.validator_gate",
236
- "validator_feedback_loop.rollback_adapter",
237
- "episodic_memory",
238
- "episodic_memory.adapter",
239
- "memory_boundary_guard",
240
- "memory_boundary_guard.adapter",
241
- "memory_boundary_guard.rollback_filter",
242
- "session_compactor",
243
- "session_compactor.adapter"
244
- ],
245
- "version": "veriloop.lora_recipe_veriloop.v2"
246
- },
247
- "selected_surfaces": [
248
- "custom_runtime_harness_bridge",
249
- "custom_validator_bridge",
250
- "custom_memory_boundary_bridge"
251
- ],
252
- "selected_target_modules": [
253
- "request_normalizer",
254
- "request_normalizer.adapter",
255
- "runtime_harness_adapter",
256
- "runtime_harness_adapter.bridge",
257
- "tool_protocol_adapter",
258
- "tool_protocol_adapter.bridge",
259
- "toolspec_bridge",
260
- "toolspec_bridge.adapter",
261
- "toolspec_head",
262
- "toolspec_head.param_schema_adapter",
263
- "toolspec_head.postcondition_adapter",
264
- "toolspec_head.precondition_adapter",
265
- "toolspec_head.receipt_formatter",
266
- "toolspec_head.trigger_gate",
267
- "toolspec_head.validator_gate",
268
- "validator_feedback_bridge",
269
- "validator_feedback_bridge.adapter"
270
- ],
271
- "selection_mode": "minimal",
272
- "version": "veriloop.toolspec_adapter_trainer.v5.qwen36",
273
- "warnings": [
274
- "Harness Engineering is primary; PEFT is limited to obedience-facing, interface-facing support surfaces.",
275
- "Backbone bridge tuning disabled explicitly; selector stays on custom surfaces or no-op."
276
- ]
277
- },
278
- "status": "trained",
279
- "train_metrics": {
280
- "adapter_exported": true,
281
- "auto_lora_from_ia3": false,
282
- "best_epoch": 4,
283
- "best_quality_score": 0.46349615617231893,
284
- "epochs_completed": 5,
285
- "loss": 0.42175399448190415,
286
- "micro_batches": 70,
287
- "micro_batches_total": 350,
288
- "optimizer_steps": 5,
289
- "optimizer_steps_total": 25,
290
- "peft_method": "lora_narrow",
291
- "used_peft": true
292
- },
293
- "version": "veriloop.toolspec_adapter_trainer.v5.qwen36",
294
- "warnings": [
295
- "Harness Engineering is primary; PEFT is limited to obedience-facing, interface-facing support surfaces.",
296
- "Backbone bridge tuning disabled explicitly; selector stays on custom surfaces or no-op.",
297
- "Synthetic holdout split used for quality-oriented train/eval separation."
298
- ]
299
- }