ConorWang committed on
Commit
10d30bd
·
verified ·
1 Parent(s): 05bba4d

Delete uncertainty_adapter_plan.json

Browse files
Files changed (1) hide show
  1. uncertainty_adapter_plan.json +0 -469
uncertainty_adapter_plan.json DELETED
@@ -1,469 +0,0 @@
1
- {
2
- "adapter_alpha": 16,
3
- "adapter_dropout": 0.05,
4
- "adapter_rank": 8,
5
- "backbone_manifest": {
6
- "host_inventory_size": 79
7
- },
8
- "config": {
9
- "allow_backbone_bridge": false,
10
- "backbone": "/public/wang_libo/veriloop_coder_e1/model",
11
- "bf16": true,
12
- "cache_dir": null,
13
- "cpu_max_memory_gib": 96,
14
- "dataset_jsonl": null,
15
- "dim_weights": {
16
- "u_answer": 1.1,
17
- "u_evidence": 1.35,
18
- "u_exec": 1.35,
19
- "u_risk": 1.55,
20
- "u_spec": 1.25
21
- },
22
- "early_stopping_min_delta": 0.001,
23
- "early_stopping_patience": 2,
24
- "enable_synthetic_dataset": true,
25
- "eval_jsonl": null,
26
- "eval_samples_per_mode": 5,
27
- "fp16": false,
28
- "gpu_max_memory_gib": 44,
29
- "gradient_accumulation_steps": 16,
30
- "host_dropout": 0.0,
31
- "learning_rate": 2e-05,
32
- "local_files_only": true,
33
- "logging_steps": 10,
34
- "max_grad_norm": 1.0,
35
- "max_length": 1664,
36
- "min_epochs_before_early_stop": 2,
37
- "num_train_epochs": 4.0,
38
- "output_dir": "./outputs/uncertainty_qwen36_rootfix_run1",
39
- "per_device_eval_batch_size": 1,
40
- "per_device_train_batch_size": 1,
41
- "prefer_best_checkpoint_export": true,
42
- "probe_dropout": 0.03,
43
- "probe_hidden_factor": 0.75,
44
- "product_line": "veriloop_coder",
45
- "quantization_mode": "4bit",
46
- "quantization_required": false,
47
- "require_trainable_targets": true,
48
- "revision": null,
49
- "run_post_train_eval": true,
50
- "save_best_checkpoint": true,
51
- "seed": 11,
52
- "selection_mode": "minimal",
53
- "train_samples_per_mode": 14,
54
- "training_mode": "mounted_head",
55
- "trust_remote_code": true,
56
- "use_double_quant": true,
57
- "warmup_ratio": 0.05,
58
- "weight_decay": 0.0,
59
- "weighted_mae_penalty": 0.5,
60
- "weighted_rmse_penalty": 0.5
61
- },
62
- "dataset_summary": {
63
- "eval_modes": {
64
- "conflicting_evidence": 5,
65
- "evidence_gap": 5,
66
- "exec_required": 5,
67
- "high_risk": 5,
68
- "low_uncertainty": 5,
69
- "patch_pending": 5,
70
- "reverse_engineering_ambiguity": 5,
71
- "self_check_failure": 5,
72
- "spec_mismatch": 5,
73
- "validator_negation": 5,
74
- "worktree_conflict": 5
75
- },
76
- "eval_size": 55,
77
- "train_modes": {
78
- "conflicting_evidence": 14,
79
- "evidence_gap": 14,
80
- "exec_required": 14,
81
- "high_risk": 14,
82
- "low_uncertainty": 14,
83
- "patch_pending": 14,
84
- "reverse_engineering_ambiguity": 14,
85
- "self_check_failure": 14,
86
- "spec_mismatch": 14,
87
- "validator_negation": 14,
88
- "worktree_conflict": 14
89
- },
90
- "train_size": 154
91
- },
92
- "head_strategy": "host_head",
93
- "notes": [
94
- "Primary route is host-surface-first uncertainty training.",
95
- "Validator receipts, self-check failure, reverse-engineering ambiguity, worktree conflicts, and patch continuity are first-class signals.",
96
- "DualPath, Full AttnRes, mHC, routers, experts, and broad attention-layer PEFT stay excluded.",
97
- "This adapter should improve runtime uncertainty routing, not general coding free-formity."
98
- ],
99
- "peft_method": "lora_narrow",
100
- "recipe": {
101
- "adapter_family": "uncertainty",
102
- "backbone": "/public/wang_libo/veriloop_coder_e1/model",
103
- "backbone_family": "qwen_dense",
104
- "excluded_patterns": [
105
- "(?i)\\bdualpath\\b",
106
- "(?i)\\bmhc\\b",
107
- "(?i)\\bfull[_\\- ]?attnres\\b",
108
- "(?i)\\battnres(_full)?\\b",
109
- "(?i)\\brouter\\b",
110
- "(?i)\\bexperts?\\b",
111
- "(?i)\\bmoe\\b.*\\b(gate|router|expert)\\b",
112
- "(?i)\\brope\\b.*\\b(freq|inv_freq|theta|rotary)\\b",
113
- "(?i)\\bkvcache\\b",
114
- "(?i)\\bposition_embedding\\b",
115
- "(?i)\\bembed(tokens|ding)?\\b",
116
- "(?i)\\blm_head\\b"
117
- ],
118
- "harness_constraints": [
119
- "Harness Engineering remains the primary convergence layer.",
120
- "Adapter must not bypass runtime orchestrator / validator / rollback loops.",
121
- "Adapter outputs remain subordinate to VeriLoop control-plane decisions.",
122
- "Adapter must not create hidden prompt-style memory authority.",
123
- "Adapter must support bounded uncertainty calibration rather than generic hesitation.",
124
- "Validator and receipt evidence must remain able to update uncertainty."
125
- ],
126
- "hyperparams": {
127
- "alpha": 16,
128
- "bias": "none",
129
- "dropout": 0.05,
130
- "fan_in_fan_out": false,
131
- "modules_to_save": [
132
- "input_layernorm"
133
- ],
134
- "r": 8,
135
- "task_type": "CAUSAL_LM"
136
- },
137
- "merge_policy": "merge_after_guard",
138
- "metadata": {
139
- "allow_backbone_bridge": false,
140
- "allow_vla_action_expert": false,
141
- "harness_first": true,
142
- "prefer_explicit_heads": true,
143
- "prefer_qlora_for_backbone_bridge": true,
144
- "require_harness_first": true,
145
- "selector_group_count": 2,
146
- "strict_narrow_scope": true,
147
- "trainer": "veriloop.uncertainty_adapter_trainer.v5.qwen36",
148
- "uncertainty_training": true
149
- },
150
- "notes": [
151
- "Backbone bridge tuning disabled explicitly; selector stays on custom surfaces or no-op.",
152
- "Backbone family inferred as qwen_dense.",
153
- "PEFT method resolved as lora_narrow.",
154
- "Recipe is harness-first: runtime convergence remains in VeriLoop control-plane + harness, not in broad weight surgery.",
155
- "Block AttnRes, DualPath, mHC hooks, RoPE, KV-cache, and broad MoE routing remain structurally excluded."
156
- ],
157
- "peft_method": "lora_narrow",
158
- "precision_policy": "auto",
159
- "product_line": "veriloop_coder",
160
- "regression_requirements": [
161
- "Must pass PEFT regression guard structural policy checks.",
162
- "Must not introduce forbidden backbone/serving structural targets.",
163
- "Must preserve harness regression envelope for the selected product line.",
164
- "Budgeted uncertainty convergence must not regress.",
165
- "Uncertainty calibration must not collapse into generic caution."
166
- ],
167
- "target_groups": [
168
- {
169
- "alpha": 16,
170
- "dropout": 0.0,
171
- "name": "group_1_custom_control_head",
172
- "rank": 8,
173
- "rationale": "Prefer explicit uncertainty / calibration heads over backbone surgery.",
174
- "surface": "custom_control_head",
175
- "target_modules": [
176
- "uncertainty_head",
177
- "uncertainty_head.calibration_mlp",
178
- "uncertainty_head.proj"
179
- ]
180
- },
181
- {
182
- "alpha": 16,
183
- "dropout": 0.0,
184
- "name": "group_2_custom_validator_bridge",
185
- "rank": 8,
186
- "rationale": "Validation and rollback fidelity should prefer explicit validator / rollback bridges.",
187
- "surface": "custom_validator_bridge",
188
- "target_modules": [
189
- "failure_signal_bridge",
190
- "failure_signal_bridge.rollback_bridge",
191
- "rollback_adapter",
192
- "rollback_adapter.head",
193
- "sandbox_rollback_bridge",
194
- "sandbox_rollback_bridge.adapter",
195
- "validator_feedback_bridge",
196
- "validator_feedback_bridge.adapter",
197
- "validator_feedback_loop.rollback_adapter"
198
- ]
199
- }
200
- ],
201
- "target_modules": [
202
- "uncertainty_head",
203
- "uncertainty_head.calibration_mlp",
204
- "uncertainty_head.proj",
205
- "failure_signal_bridge",
206
- "failure_signal_bridge.rollback_bridge",
207
- "rollback_adapter",
208
- "rollback_adapter.head",
209
- "sandbox_rollback_bridge",
210
- "sandbox_rollback_bridge.adapter",
211
- "validator_feedback_bridge",
212
- "validator_feedback_bridge.adapter",
213
- "validator_feedback_loop.rollback_adapter"
214
- ],
215
- "version": "veriloop.lora_recipe_veriloop.v2"
216
- },
217
- "selected_target_modules": [
218
- "uncertainty_head",
219
- "uncertainty_head.calibration_mlp",
220
- "uncertainty_head.proj"
221
- ],
222
- "target_selection": {
223
- "backbone_archetype": "qwen_dense",
224
- "exclusions": [
225
- {
226
- "pattern": "(^|\\.)lm_head($|\\.)",
227
- "reason": "Do not retune final token head; too broad and evaluation-heavy."
228
- },
229
- {
230
- "pattern": "(^|\\.)embed_tokens($|\\.)",
231
- "reason": "Embedding surgery risks broad semantic drift."
232
- },
233
- {
234
- "pattern": "(^|\\.)norm($|\\.)",
235
- "reason": "Global norm tuning can destabilize calibration across scenes."
236
- },
237
- {
238
- "pattern": "attnres|attention_residual",
239
- "reason": "Block AttnRes may be mounted structurally but is never a PEFT target."
240
- },
241
- {
242
- "pattern": "dualpath",
243
- "reason": "DualPath is serving/runtime infrastructure only."
244
- },
245
- {
246
- "pattern": "mhc|hyper[-_]?connection",
247
- "reason": "mHC-inspired stability hooks remain structural, not PEFT surfaces."
248
- },
249
- {
250
- "pattern": "rope|rotary",
251
- "reason": "RoPE/context surgery is handled architecturally, not by narrow PEFT here."
252
- },
253
- {
254
- "pattern": "kvcache|kv_cache",
255
- "reason": "KV-cache runtime surfaces are not PEFT targets."
256
- },
257
- {
258
- "pattern": "(^|\\.)memory(_store|_bank)?($|\\.)",
259
- "reason": "Persistent memory stores are harness/runtime policy surfaces, not PEFT targets."
260
- }
261
- ],
262
- "inventory_size": 79,
263
- "inventory_source": "provided_names",
264
- "notes": [
265
- "Harness Engineering is primary; PEFT is limited to obedience-facing, interface-facing support surfaces.",
266
- "Backbone bridge tuning disabled explicitly; selector stays on custom surfaces or no-op."
267
- ],
268
- "recommended_training": "ia3_head_only",
269
- "request": {
270
- "allow_backbone_bridge": false,
271
- "allow_vla_action_expert": false,
272
- "backbone": "/public/wang_libo/veriloop_coder_e1/model",
273
- "explicit_exclude_patterns": [],
274
- "explicit_include_patterns": [],
275
- "intents": [
276
- "uncertainty",
277
- "validator_alignment",
278
- "harness_alignment",
279
- "runtime_protocol",
280
- "session_continuity",
281
- "worktree_discipline"
282
- ],
283
- "prefer_qlora_for_backbone_bridge": true,
284
- "product_line": "veriloop_coder",
285
- "selection_mode": "minimal"
286
- },
287
- "selected_groups": [
288
- {
289
- "alpha": 16,
290
- "dropout": 0.0,
291
- "exclude_patterns": [
292
- "(^|\\.)lm_head($|\\.)",
293
- "(^|\\.)embed_tokens($|\\.)",
294
- "(^|\\.)norm($|\\.)",
295
- "attnres|attention_residual",
296
- "dualpath",
297
- "mhc|hyper[-_]?connection",
298
- "rope|rotary",
299
- "kvcache|kv_cache",
300
- "(^|\\.)memory(_store|_bank)?($|\\.)"
301
- ],
302
- "include_patterns": [
303
- "(^|\\.)(uncertainty_head|uncertainty_adapter|calib(_head|ration_adapter)?)($|\\.)"
304
- ],
305
- "intents": [
306
- "uncertainty"
307
- ],
308
- "layer_window": {
309
- "mode": "all",
310
- "value": 0.0
311
- },
312
- "matched_module_names": [
313
- "uncertainty_head",
314
- "uncertainty_head.calibration_mlp",
315
- "uncertainty_head.proj"
316
- ],
317
- "name": "group_1_custom_control_head",
318
- "rank": 8,
319
- "rationale": "Prefer explicit uncertainty / calibration heads over backbone surgery.",
320
- "risk": "low",
321
- "surface": "custom_control_head"
322
- },
323
- {
324
- "alpha": 16,
325
- "dropout": 0.05,
326
- "exclude_patterns": [
327
- "(^|\\.)lm_head($|\\.)",
328
- "(^|\\.)embed_tokens($|\\.)",
329
- "(^|\\.)norm($|\\.)",
330
- "attnres|attention_residual",
331
- "dualpath",
332
- "mhc|hyper[-_]?connection",
333
- "rope|rotary",
334
- "kvcache|kv_cache",
335
- "(^|\\.)memory(_store|_bank)?($|\\.)"
336
- ],
337
- "include_patterns": [
338
- "(^|\\.)(runtime_harness|query_runtime|task_brief|task_runtime|tool_protocol|permission_context|worktree|session_state|request_normalizer|action_allowlist|constraint_guard|progress_state|workspace_snapshot|repo_contract|knowledge_entry|completion_criteria|search_bridge|sandbox_search_bridge)(_adapter|_bridge|_head)?($|\\.)",
339
- "(^|\\.)(toolspec|tool(_call)?(_grammar|_interface)?|harness|validator|rollback|receipt|patch|permission|session|worktree)(_adapter|_bridge|_head)?($|\\.)"
340
- ],
341
- "intents": [
342
- "harness_alignment",
343
- "runtime_protocol",
344
- "session_continuity",
345
- "worktree_discipline"
346
- ],
347
- "layer_window": {
348
- "mode": "all",
349
- "value": 0.0
350
- },
351
- "matched_module_names": [
352
- "failure_signal_bridge.rollback_bridge",
353
- "request_normalizer",
354
- "request_normalizer.adapter",
355
- "rollback_adapter",
356
- "rollback_adapter.head",
357
- "runtime_harness_adapter",
358
- "runtime_harness_adapter.bridge",
359
- "tool_protocol_adapter",
360
- "tool_protocol_adapter.bridge",
361
- "toolspec_bridge",
362
- "toolspec_bridge.adapter",
363
- "toolspec_head",
364
- "toolspec_head.param_schema_adapter",
365
- "toolspec_head.postcondition_adapter",
366
- "toolspec_head.precondition_adapter",
367
- "toolspec_head.receipt_formatter",
368
- "toolspec_head.trigger_gate",
369
- "toolspec_head.validator_gate",
370
- "validator_feedback_loop.rollback_adapter"
371
- ],
372
- "name": "group_2_custom_runtime_harness_bridge",
373
- "rank": 8,
374
- "rationale": "Runtime / harness obedience should attach to explicit interface bridges before any backbone fallback.",
375
- "risk": "low",
376
- "surface": "custom_runtime_harness_bridge"
377
- },
378
- {
379
- "alpha": 16,
380
- "dropout": 0.0,
381
- "exclude_patterns": [
382
- "(^|\\.)lm_head($|\\.)",
383
- "(^|\\.)embed_tokens($|\\.)",
384
- "(^|\\.)norm($|\\.)",
385
- "attnres|attention_residual",
386
- "dualpath",
387
- "mhc|hyper[-_]?connection",
388
- "rope|rotary",
389
- "kvcache|kv_cache",
390
- "(^|\\.)memory(_store|_bank)?($|\\.)"
391
- ],
392
- "include_patterns": [
393
- "(^|\\.)(validator_feedback|sandbox_result_validator|sandbox_rollback_bridge|failure_signal|rollback)(_adapter|_bridge|_head)?($|\\.)"
394
- ],
395
- "intents": [
396
- "validator_alignment"
397
- ],
398
- "layer_window": {
399
- "mode": "all",
400
- "value": 0.0
401
- },
402
- "matched_module_names": [
403
- "failure_signal_bridge",
404
- "failure_signal_bridge.rollback_bridge",
405
- "rollback_adapter",
406
- "rollback_adapter.head",
407
- "sandbox_rollback_bridge",
408
- "sandbox_rollback_bridge.adapter",
409
- "validator_feedback_bridge",
410
- "validator_feedback_bridge.adapter",
411
- "validator_feedback_loop.rollback_adapter"
412
- ],
413
- "name": "group_3_custom_validator_bridge",
414
- "rank": 8,
415
- "rationale": "Validation and rollback fidelity should prefer explicit validator / rollback bridges.",
416
- "risk": "low",
417
- "surface": "custom_validator_bridge"
418
- },
419
- {
420
- "alpha": 8,
421
- "dropout": 0.0,
422
- "exclude_patterns": [
423
- "(^|\\.)lm_head($|\\.)",
424
- "(^|\\.)embed_tokens($|\\.)",
425
- "(^|\\.)norm($|\\.)",
426
- "attnres|attention_residual",
427
- "dualpath",
428
- "mhc|hyper[-_]?connection",
429
- "rope|rotary",
430
- "kvcache|kv_cache",
431
- "(^|\\.)memory(_store|_bank)?($|\\.)"
432
- ],
433
- "include_patterns": [
434
- "(^|\\.)(memory_boundary_guard|episodic_memory|session_compactor)(_adapter|_bridge|_head)?($|\\.)"
435
- ],
436
- "intents": [
437
- "session_continuity"
438
- ],
439
- "layer_window": {
440
- "mode": "all",
441
- "value": 0.0
442
- },
443
- "matched_module_names": [
444
- "episodic_memory",
445
- "episodic_memory.adapter",
446
- "memory_boundary_guard",
447
- "memory_boundary_guard.adapter",
448
- "memory_boundary_guard.rollback_filter",
449
- "session_compactor",
450
- "session_compactor.adapter"
451
- ],
452
- "name": "group_4_custom_memory_boundary_bridge",
453
- "rank": 4,
454
- "rationale": "Session continuity should bind to boundary-aware memory packet surfaces rather than broad backbone tuning.",
455
- "risk": "low",
456
- "surface": "custom_memory_boundary_bridge"
457
- }
458
- ],
459
- "upstream_profile_hint": null,
460
- "version": "veriloop.peft_target_selector.v2",
461
- "warnings": []
462
- },
463
- "training_mode": "mounted_head",
464
- "version": "veriloop.uncertainty_adapter_trainer.v5.qwen36",
465
- "warnings": [
466
- "Harness Engineering is primary; PEFT is limited to obedience-facing, interface-facing support surfaces.",
467
- "Backbone bridge tuning disabled explicitly; selector stays on custom surfaces or no-op."
468
- ]
469
- }