ConorWang committed on
Commit
4882ac0
·
verified ·
1 Parent(s): a856587

Upload fine-tuned artifacts to repo root

Browse files
adapter/adapter_config.json CHANGED
@@ -30,8 +30,17 @@
30
  "rank_pattern": {},
31
  "revision": null,
32
  "target_modules": [
33
- "surface_host.uncertainty_head.proj",
34
- "surface_host.uncertainty_head.calibration_mlp"
 
 
 
 
 
 
 
 
 
35
  ],
36
  "target_parameters": null,
37
  "task_type": "FEATURE_EXTRACTION",
 
30
  "rank_pattern": {},
31
  "revision": null,
32
  "target_modules": [
33
+ "surface_host.toolspec_bridge.adapter",
34
+ "surface_host.validator_feedback_bridge.adapter",
35
+ "surface_host.toolspec_head.receipt_formatter",
36
+ "surface_host.toolspec_head.precondition_adapter",
37
+ "surface_host.toolspec_head.validator_gate",
38
+ "surface_host.toolspec_head.postcondition_adapter",
39
+ "surface_host.tool_protocol_adapter.bridge",
40
+ "surface_host.runtime_harness_adapter.bridge",
41
+ "surface_host.toolspec_head.trigger_gate",
42
+ "surface_host.request_normalizer.adapter",
43
+ "surface_host.toolspec_head.param_schema_adapter"
44
  ],
45
  "target_parameters": null,
46
  "task_type": "FEATURE_EXTRACTION",
adapter/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fcca67011c0b0b0eaa44fc4826f4908bdd6ca8d82b192916a6e35556e292fa7f
3
- size 98968
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e62775d0cd91a0604b237b7d50cdb1da249ec85e8f9a2c6ad4fd7ed8afc805a2
3
+ size 724048
best_checkpoint_manifest.json CHANGED
@@ -1,33 +1,27 @@
1
  {
2
- "best_epoch": 2,
3
- "best_quality_score": 0.8625935807221907,
4
  "eval_metrics": {
5
- "count": 55,
6
- "mae": {
7
- "u_answer": 0.15174226462841034,
8
- "u_evidence": 0.19610758125782013,
9
- "u_exec": 0.18561214208602905,
10
- "u_risk": 0.1553734689950943,
11
- "u_spec": 0.21633382141590118
12
- },
13
- "mean_mae": 0.18103384971618652,
14
- "mean_rmse": 0.24169571697711945,
15
- "moderate_accuracy": 0.6727272727272727,
16
- "quality_score": 0.8625935807221907,
17
- "rmse": {
18
- "u_answer": 0.18724055588245392,
19
- "u_evidence": 0.22527915239334106,
20
- "u_exec": 0.25238174200057983,
21
- "u_risk": 0.20667441189289093,
22
- "u_spec": 0.3369026482105255
23
- },
24
- "tight_accuracy": 0.4,
25
- "weighted_mae": 0.18083095811830807,
26
- "weighted_rmse": 0.24125460771003793
27
  },
28
  "train_metrics": {
29
- "loss": 0.009006613283418119,
30
- "micro_batches": 154,
31
- "optimizer_steps": 10
32
  }
33
  }
 
1
  {
2
+ "best_epoch": 4,
3
+ "best_quality_score": 0.46349615617231893,
4
  "eval_metrics": {
5
+ "avg_binary_accuracy": 0.81,
6
+ "confirmation_required_accuracy": 0.8,
7
+ "count": 25,
8
+ "eval_batches": 25,
9
+ "eval_loss": 6.897225952148437,
10
+ "mode_accuracy": 0.56,
11
+ "permission_bit_accuracy": 0.8545454545454545,
12
+ "precondition_ok_accuracy": 0.76,
13
+ "quality_score": 0.46349615617231893,
14
+ "rollback_supported_accuracy": 0.8,
15
+ "schema_ok_accuracy": 0.76,
16
+ "session_required_accuracy": 1.0,
17
+ "tool_accuracy": 0.44,
18
+ "trigger_accuracy": 0.76,
19
+ "validator_required_accuracy": 0.8,
20
+ "worktree_required_accuracy": 0.8
 
 
 
 
 
 
21
  },
22
  "train_metrics": {
23
+ "loss": 0.42175399448190415,
24
+ "micro_batches": 70,
25
+ "optimizer_steps": 5
26
  }
27
  }
epoch_history.json CHANGED
@@ -3,137 +3,141 @@
3
  {
4
  "epoch": 1,
5
  "eval_metrics": {
6
- "count": 55,
7
- "mae": {
8
- "u_answer": 0.1848176270723343,
9
- "u_evidence": 0.20735961198806763,
10
- "u_exec": 0.21166233718395233,
11
- "u_risk": 0.1652287244796753,
12
- "u_spec": 0.24522197246551514
13
- },
14
- "mean_mae": 0.2028580605983734,
15
- "mean_rmse": 0.2640994191169739,
16
- "moderate_accuracy": 0.6036363636363636,
17
- "quality_score": 0.8344919736975306,
18
- "rmse": {
19
- "u_answer": 0.2176007330417633,
20
- "u_evidence": 0.23360508680343628,
21
- "u_exec": 0.2795017957687378,
22
- "u_risk": 0.22334341704845428,
23
- "u_spec": 0.36644604802131653
24
- },
25
- "tight_accuracy": 0.36727272727272725,
26
- "weighted_mae": 0.20175925098418107,
27
- "weighted_rmse": 0.26307498343893954
28
  },
29
  "improved": true,
30
- "quality_score": 0.8344919736975306,
31
  "train_metrics": {
32
- "loss": 0.011121059906239584,
33
- "micro_batches": 154,
34
- "optimizer_steps": 10
35
  }
36
  },
37
  {
38
  "epoch": 2,
39
  "eval_metrics": {
40
- "count": 55,
41
- "mae": {
42
- "u_answer": 0.15174226462841034,
43
- "u_evidence": 0.19610758125782013,
44
- "u_exec": 0.18561214208602905,
45
- "u_risk": 0.1553734689950943,
46
- "u_spec": 0.21633382141590118
47
- },
48
- "mean_mae": 0.18103384971618652,
49
- "mean_rmse": 0.24169571697711945,
50
- "moderate_accuracy": 0.6727272727272727,
51
- "quality_score": 0.8625935807221907,
52
- "rmse": {
53
- "u_answer": 0.18724055588245392,
54
- "u_evidence": 0.22527915239334106,
55
- "u_exec": 0.25238174200057983,
56
- "u_risk": 0.20667441189289093,
57
- "u_spec": 0.3369026482105255
58
- },
59
- "tight_accuracy": 0.4,
60
- "weighted_mae": 0.18083095811830807,
61
- "weighted_rmse": 0.24125460771003793
62
  },
63
  "improved": true,
64
- "quality_score": 0.8625935807221907,
65
  "train_metrics": {
66
- "loss": 0.009006613283418119,
67
- "micro_batches": 154,
68
- "optimizer_steps": 10
69
  }
70
  },
71
  {
72
  "epoch": 3,
73
  "eval_metrics": {
74
- "count": 55,
75
- "mae": {
76
- "u_answer": 0.14970968663692474,
77
- "u_evidence": 0.19498984515666962,
78
- "u_exec": 0.18136857450008392,
79
- "u_risk": 0.1565144807100296,
80
- "u_spec": 0.21266111731529236
81
- },
82
- "mean_mae": 0.17904874682426453,
83
- "mean_rmse": 0.23914317786693573,
84
- "moderate_accuracy": 0.6545454545454545,
85
- "quality_score": 0.8630735522772117,
86
- "rmse": {
87
- "u_answer": 0.1858142465353012,
88
- "u_evidence": 0.22504529356956482,
89
- "u_exec": 0.24751117825508118,
90
- "u_risk": 0.20870783925056458,
91
- "u_spec": 0.3286373019218445
92
- },
93
- "tight_accuracy": 0.3927272727272727,
94
- "weighted_mae": 0.1789679336398722,
95
- "weighted_rmse": 0.23888496180570432
96
  },
97
  "improved": false,
98
- "quality_score": 0.8630735522772117,
99
  "train_metrics": {
100
- "loss": 0.008164266918108544,
101
- "micro_batches": 154,
102
- "optimizer_steps": 10
103
  }
104
  },
105
  {
106
  "epoch": 4,
107
  "eval_metrics": {
108
- "count": 55,
109
- "mae": {
110
- "u_answer": 0.1496635228395462,
111
- "u_evidence": 0.19500812888145447,
112
- "u_exec": 0.18158338963985443,
113
- "u_risk": 0.1564789116382599,
114
- "u_spec": 0.21253055334091187
115
- },
116
- "mean_mae": 0.1790529191493988,
117
- "mean_rmse": 0.23915143311023712,
118
- "moderate_accuracy": 0.6545454545454545,
119
- "quality_score": 0.8630639342548476,
120
- "rmse": {
121
- "u_answer": 0.1857716143131256,
122
- "u_evidence": 0.22511473298072815,
123
- "u_exec": 0.24768365919589996,
124
- "u_risk": 0.20870527625083923,
125
- "u_spec": 0.32848188281059265
126
- },
127
- "tight_accuracy": 0.3927272727272727,
128
- "weighted_mae": 0.17897483332915498,
129
- "weighted_rmse": 0.2388972981611497
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
130
  },
131
  "improved": false,
132
- "quality_score": 0.8630639342548476,
133
  "train_metrics": {
134
- "loss": 0.008081083455086723,
135
- "micro_batches": 154,
136
- "optimizer_steps": 10
137
  }
138
  }
139
  ]
 
3
  {
4
  "epoch": 1,
5
  "eval_metrics": {
6
+ "avg_binary_accuracy": 0.795,
7
+ "confirmation_required_accuracy": 0.8,
8
+ "count": 25,
9
+ "eval_batches": 25,
10
+ "eval_loss": 7.704372234344483,
11
+ "mode_accuracy": 0.44,
12
+ "permission_bit_accuracy": 0.850909090909091,
13
+ "precondition_ok_accuracy": 0.76,
14
+ "quality_score": 0.21877532557574186,
15
+ "rollback_supported_accuracy": 0.72,
16
+ "schema_ok_accuracy": 0.76,
17
+ "session_required_accuracy": 1.0,
18
+ "tool_accuracy": 0.24,
19
+ "trigger_accuracy": 0.76,
20
+ "validator_required_accuracy": 0.8,
21
+ "worktree_required_accuracy": 0.76
 
 
 
 
 
 
22
  },
23
  "improved": true,
24
+ "quality_score": 0.21877532557574186,
25
  "train_metrics": {
26
+ "loss": 0.5388983534915107,
27
+ "micro_batches": 70,
28
+ "optimizer_steps": 5
29
  }
30
  },
31
  {
32
  "epoch": 2,
33
  "eval_metrics": {
34
+ "avg_binary_accuracy": 0.81,
35
+ "confirmation_required_accuracy": 0.8,
36
+ "count": 25,
37
+ "eval_batches": 25,
38
+ "eval_loss": 7.129253711700439,
39
+ "mode_accuracy": 0.48,
40
+ "permission_bit_accuracy": 0.8545454545454545,
41
+ "precondition_ok_accuracy": 0.76,
42
+ "quality_score": 0.4400157397790389,
43
+ "rollback_supported_accuracy": 0.8,
44
+ "schema_ok_accuracy": 0.76,
45
+ "session_required_accuracy": 1.0,
46
+ "tool_accuracy": 0.44,
47
+ "trigger_accuracy": 0.76,
48
+ "validator_required_accuracy": 0.8,
49
+ "worktree_required_accuracy": 0.8
 
 
 
 
 
 
50
  },
51
  "improved": true,
52
+ "quality_score": 0.4400157397790389,
53
  "train_metrics": {
54
+ "loss": 0.4655745736190251,
55
+ "micro_batches": 70,
56
+ "optimizer_steps": 5
57
  }
58
  },
59
  {
60
  "epoch": 3,
61
  "eval_metrics": {
62
+ "avg_binary_accuracy": 0.81,
63
+ "confirmation_required_accuracy": 0.8,
64
+ "count": 25,
65
+ "eval_batches": 25,
66
+ "eval_loss": 6.935494079589843,
67
+ "mode_accuracy": 0.48,
68
+ "permission_bit_accuracy": 0.8545454545454545,
69
+ "precondition_ok_accuracy": 0.76,
70
+ "quality_score": 0.4229221342606978,
71
+ "rollback_supported_accuracy": 0.8,
72
+ "schema_ok_accuracy": 0.76,
73
+ "session_required_accuracy": 1.0,
74
+ "tool_accuracy": 0.4,
75
+ "trigger_accuracy": 0.76,
76
+ "validator_required_accuracy": 0.8,
77
+ "worktree_required_accuracy": 0.8
 
 
 
 
 
 
78
  },
79
  "improved": false,
80
+ "quality_score": 0.4229221342606978,
81
  "train_metrics": {
82
+ "loss": 0.43205853487764084,
83
+ "micro_batches": 70,
84
+ "optimizer_steps": 5
85
  }
86
  },
87
  {
88
  "epoch": 4,
89
  "eval_metrics": {
90
+ "avg_binary_accuracy": 0.81,
91
+ "confirmation_required_accuracy": 0.8,
92
+ "count": 25,
93
+ "eval_batches": 25,
94
+ "eval_loss": 6.897225952148437,
95
+ "mode_accuracy": 0.56,
96
+ "permission_bit_accuracy": 0.8545454545454545,
97
+ "precondition_ok_accuracy": 0.76,
98
+ "quality_score": 0.46349615617231893,
99
+ "rollback_supported_accuracy": 0.8,
100
+ "schema_ok_accuracy": 0.76,
101
+ "session_required_accuracy": 1.0,
102
+ "tool_accuracy": 0.44,
103
+ "trigger_accuracy": 0.76,
104
+ "validator_required_accuracy": 0.8,
105
+ "worktree_required_accuracy": 0.8
106
+ },
107
+ "improved": true,
108
+ "quality_score": 0.46349615617231893,
109
+ "train_metrics": {
110
+ "loss": 0.42175399448190415,
111
+ "micro_batches": 70,
112
+ "optimizer_steps": 5
113
+ }
114
+ },
115
+ {
116
+ "epoch": 5,
117
+ "eval_metrics": {
118
+ "avg_binary_accuracy": 0.81,
119
+ "confirmation_required_accuracy": 0.8,
120
+ "count": 25,
121
+ "eval_batches": 25,
122
+ "eval_loss": 6.89590030670166,
123
+ "mode_accuracy": 0.56,
124
+ "permission_bit_accuracy": 0.8545454545454545,
125
+ "precondition_ok_accuracy": 0.76,
126
+ "quality_score": 0.4635160408540206,
127
+ "rollback_supported_accuracy": 0.8,
128
+ "schema_ok_accuracy": 0.76,
129
+ "session_required_accuracy": 1.0,
130
+ "tool_accuracy": 0.44,
131
+ "trigger_accuracy": 0.76,
132
+ "validator_required_accuracy": 0.8,
133
+ "worktree_required_accuracy": 0.8
134
  },
135
  "improved": false,
136
+ "quality_score": 0.4635160408540206,
137
  "train_metrics": {
138
+ "loss": 0.4198248211826597,
139
+ "micro_batches": 70,
140
+ "optimizer_steps": 5
141
  }
142
  }
143
  ]
host_manifest.json CHANGED
@@ -68,6 +68,16 @@
68
  "query_runtime_engine.adapter",
69
  "request_normalizer",
70
  "request_normalizer.adapter",
 
 
 
 
 
 
 
 
 
 
71
  "rollback_adapter",
72
  "rollback_adapter.head",
73
  "rollback_engine",
@@ -76,6 +86,16 @@
76
  "runtime_binding.adapter",
77
  "runtime_harness_adapter",
78
  "runtime_harness_adapter.bridge",
 
 
 
 
 
 
 
 
 
 
79
  "runtime_harness_uncertainty_bridge",
80
  "runtime_harness_uncertainty_bridge.adapter",
81
  "sandbox_rollback_bridge",
@@ -87,40 +107,110 @@
87
  "session_state_manager.rollback_state",
88
  "tool_protocol_adapter",
89
  "tool_protocol_adapter.bridge",
 
 
 
 
 
 
 
 
 
 
90
  "toolspec_bridge",
91
  "toolspec_bridge.adapter",
 
 
 
 
 
 
 
 
 
 
92
  "toolspec_head",
93
  "toolspec_head.param_schema_adapter",
 
 
 
 
 
 
 
 
 
 
94
  "toolspec_head.postcondition_adapter",
 
 
 
 
 
 
 
 
 
 
95
  "toolspec_head.precondition_adapter",
 
 
 
 
 
 
 
 
 
 
96
  "toolspec_head.receipt_formatter",
 
 
 
 
 
 
 
 
 
 
97
  "toolspec_head.trigger_gate",
 
 
 
 
 
 
 
 
 
 
98
  "toolspec_head.validator_gate",
 
 
 
 
 
 
 
 
 
 
99
  "uncertainty_head",
100
  "uncertainty_head.calibration_mlp",
101
- "uncertainty_head.calibration_mlp.base_layer",
102
- "uncertainty_head.calibration_mlp.lora_A",
103
- "uncertainty_head.calibration_mlp.lora_A.default",
104
- "uncertainty_head.calibration_mlp.lora_B",
105
- "uncertainty_head.calibration_mlp.lora_B.default",
106
- "uncertainty_head.calibration_mlp.lora_dropout",
107
- "uncertainty_head.calibration_mlp.lora_dropout.default",
108
- "uncertainty_head.calibration_mlp.lora_embedding_A",
109
- "uncertainty_head.calibration_mlp.lora_embedding_B",
110
- "uncertainty_head.calibration_mlp.lora_magnitude_vector",
111
  "uncertainty_head.proj",
112
- "uncertainty_head.proj.base_layer",
113
- "uncertainty_head.proj.lora_A",
114
- "uncertainty_head.proj.lora_A.default",
115
- "uncertainty_head.proj.lora_B",
116
- "uncertainty_head.proj.lora_B.default",
117
- "uncertainty_head.proj.lora_dropout",
118
- "uncertainty_head.proj.lora_dropout.default",
119
- "uncertainty_head.proj.lora_embedding_A",
120
- "uncertainty_head.proj.lora_embedding_B",
121
- "uncertainty_head.proj.lora_magnitude_vector",
122
  "validator_feedback_bridge",
123
  "validator_feedback_bridge.adapter",
 
 
 
 
 
 
 
 
 
 
124
  "validator_feedback_loop",
125
  "validator_feedback_loop.rollback_adapter",
126
  "validator_receipt_bridge",
@@ -138,10 +228,10 @@
138
  "backbone_frozen": true,
139
  "backbone_present": true,
140
  "hidden_size": 2048,
141
- "host_parameters": 176310317,
142
- "host_trainable_parameters": 49192,
143
- "total_parameters": 34132368045,
144
- "trainable_parameters": 49192,
145
  "version": "veriloop.coder_peft_host.v1"
146
  },
147
  "version": "veriloop.coder_peft_host.v1"
 
68
  "query_runtime_engine.adapter",
69
  "request_normalizer",
70
  "request_normalizer.adapter",
71
+ "request_normalizer.adapter.base_layer",
72
+ "request_normalizer.adapter.lora_A",
73
+ "request_normalizer.adapter.lora_A.default",
74
+ "request_normalizer.adapter.lora_B",
75
+ "request_normalizer.adapter.lora_B.default",
76
+ "request_normalizer.adapter.lora_dropout",
77
+ "request_normalizer.adapter.lora_dropout.default",
78
+ "request_normalizer.adapter.lora_embedding_A",
79
+ "request_normalizer.adapter.lora_embedding_B",
80
+ "request_normalizer.adapter.lora_magnitude_vector",
81
  "rollback_adapter",
82
  "rollback_adapter.head",
83
  "rollback_engine",
 
86
  "runtime_binding.adapter",
87
  "runtime_harness_adapter",
88
  "runtime_harness_adapter.bridge",
89
+ "runtime_harness_adapter.bridge.base_layer",
90
+ "runtime_harness_adapter.bridge.lora_A",
91
+ "runtime_harness_adapter.bridge.lora_A.default",
92
+ "runtime_harness_adapter.bridge.lora_B",
93
+ "runtime_harness_adapter.bridge.lora_B.default",
94
+ "runtime_harness_adapter.bridge.lora_dropout",
95
+ "runtime_harness_adapter.bridge.lora_dropout.default",
96
+ "runtime_harness_adapter.bridge.lora_embedding_A",
97
+ "runtime_harness_adapter.bridge.lora_embedding_B",
98
+ "runtime_harness_adapter.bridge.lora_magnitude_vector",
99
  "runtime_harness_uncertainty_bridge",
100
  "runtime_harness_uncertainty_bridge.adapter",
101
  "sandbox_rollback_bridge",
 
107
  "session_state_manager.rollback_state",
108
  "tool_protocol_adapter",
109
  "tool_protocol_adapter.bridge",
110
+ "tool_protocol_adapter.bridge.base_layer",
111
+ "tool_protocol_adapter.bridge.lora_A",
112
+ "tool_protocol_adapter.bridge.lora_A.default",
113
+ "tool_protocol_adapter.bridge.lora_B",
114
+ "tool_protocol_adapter.bridge.lora_B.default",
115
+ "tool_protocol_adapter.bridge.lora_dropout",
116
+ "tool_protocol_adapter.bridge.lora_dropout.default",
117
+ "tool_protocol_adapter.bridge.lora_embedding_A",
118
+ "tool_protocol_adapter.bridge.lora_embedding_B",
119
+ "tool_protocol_adapter.bridge.lora_magnitude_vector",
120
  "toolspec_bridge",
121
  "toolspec_bridge.adapter",
122
+ "toolspec_bridge.adapter.base_layer",
123
+ "toolspec_bridge.adapter.lora_A",
124
+ "toolspec_bridge.adapter.lora_A.default",
125
+ "toolspec_bridge.adapter.lora_B",
126
+ "toolspec_bridge.adapter.lora_B.default",
127
+ "toolspec_bridge.adapter.lora_dropout",
128
+ "toolspec_bridge.adapter.lora_dropout.default",
129
+ "toolspec_bridge.adapter.lora_embedding_A",
130
+ "toolspec_bridge.adapter.lora_embedding_B",
131
+ "toolspec_bridge.adapter.lora_magnitude_vector",
132
  "toolspec_head",
133
  "toolspec_head.param_schema_adapter",
134
+ "toolspec_head.param_schema_adapter.base_layer",
135
+ "toolspec_head.param_schema_adapter.lora_A",
136
+ "toolspec_head.param_schema_adapter.lora_A.default",
137
+ "toolspec_head.param_schema_adapter.lora_B",
138
+ "toolspec_head.param_schema_adapter.lora_B.default",
139
+ "toolspec_head.param_schema_adapter.lora_dropout",
140
+ "toolspec_head.param_schema_adapter.lora_dropout.default",
141
+ "toolspec_head.param_schema_adapter.lora_embedding_A",
142
+ "toolspec_head.param_schema_adapter.lora_embedding_B",
143
+ "toolspec_head.param_schema_adapter.lora_magnitude_vector",
144
  "toolspec_head.postcondition_adapter",
145
+ "toolspec_head.postcondition_adapter.base_layer",
146
+ "toolspec_head.postcondition_adapter.lora_A",
147
+ "toolspec_head.postcondition_adapter.lora_A.default",
148
+ "toolspec_head.postcondition_adapter.lora_B",
149
+ "toolspec_head.postcondition_adapter.lora_B.default",
150
+ "toolspec_head.postcondition_adapter.lora_dropout",
151
+ "toolspec_head.postcondition_adapter.lora_dropout.default",
152
+ "toolspec_head.postcondition_adapter.lora_embedding_A",
153
+ "toolspec_head.postcondition_adapter.lora_embedding_B",
154
+ "toolspec_head.postcondition_adapter.lora_magnitude_vector",
155
  "toolspec_head.precondition_adapter",
156
+ "toolspec_head.precondition_adapter.base_layer",
157
+ "toolspec_head.precondition_adapter.lora_A",
158
+ "toolspec_head.precondition_adapter.lora_A.default",
159
+ "toolspec_head.precondition_adapter.lora_B",
160
+ "toolspec_head.precondition_adapter.lora_B.default",
161
+ "toolspec_head.precondition_adapter.lora_dropout",
162
+ "toolspec_head.precondition_adapter.lora_dropout.default",
163
+ "toolspec_head.precondition_adapter.lora_embedding_A",
164
+ "toolspec_head.precondition_adapter.lora_embedding_B",
165
+ "toolspec_head.precondition_adapter.lora_magnitude_vector",
166
  "toolspec_head.receipt_formatter",
167
+ "toolspec_head.receipt_formatter.base_layer",
168
+ "toolspec_head.receipt_formatter.lora_A",
169
+ "toolspec_head.receipt_formatter.lora_A.default",
170
+ "toolspec_head.receipt_formatter.lora_B",
171
+ "toolspec_head.receipt_formatter.lora_B.default",
172
+ "toolspec_head.receipt_formatter.lora_dropout",
173
+ "toolspec_head.receipt_formatter.lora_dropout.default",
174
+ "toolspec_head.receipt_formatter.lora_embedding_A",
175
+ "toolspec_head.receipt_formatter.lora_embedding_B",
176
+ "toolspec_head.receipt_formatter.lora_magnitude_vector",
177
  "toolspec_head.trigger_gate",
178
+ "toolspec_head.trigger_gate.base_layer",
179
+ "toolspec_head.trigger_gate.lora_A",
180
+ "toolspec_head.trigger_gate.lora_A.default",
181
+ "toolspec_head.trigger_gate.lora_B",
182
+ "toolspec_head.trigger_gate.lora_B.default",
183
+ "toolspec_head.trigger_gate.lora_dropout",
184
+ "toolspec_head.trigger_gate.lora_dropout.default",
185
+ "toolspec_head.trigger_gate.lora_embedding_A",
186
+ "toolspec_head.trigger_gate.lora_embedding_B",
187
+ "toolspec_head.trigger_gate.lora_magnitude_vector",
188
  "toolspec_head.validator_gate",
189
+ "toolspec_head.validator_gate.base_layer",
190
+ "toolspec_head.validator_gate.lora_A",
191
+ "toolspec_head.validator_gate.lora_A.default",
192
+ "toolspec_head.validator_gate.lora_B",
193
+ "toolspec_head.validator_gate.lora_B.default",
194
+ "toolspec_head.validator_gate.lora_dropout",
195
+ "toolspec_head.validator_gate.lora_dropout.default",
196
+ "toolspec_head.validator_gate.lora_embedding_A",
197
+ "toolspec_head.validator_gate.lora_embedding_B",
198
+ "toolspec_head.validator_gate.lora_magnitude_vector",
199
  "uncertainty_head",
200
  "uncertainty_head.calibration_mlp",
 
 
 
 
 
 
 
 
 
 
201
  "uncertainty_head.proj",
 
 
 
 
 
 
 
 
 
 
202
  "validator_feedback_bridge",
203
  "validator_feedback_bridge.adapter",
204
+ "validator_feedback_bridge.adapter.base_layer",
205
+ "validator_feedback_bridge.adapter.lora_A",
206
+ "validator_feedback_bridge.adapter.lora_A.default",
207
+ "validator_feedback_bridge.adapter.lora_B",
208
+ "validator_feedback_bridge.adapter.lora_B.default",
209
+ "validator_feedback_bridge.adapter.lora_dropout",
210
+ "validator_feedback_bridge.adapter.lora_dropout.default",
211
+ "validator_feedback_bridge.adapter.lora_embedding_A",
212
+ "validator_feedback_bridge.adapter.lora_embedding_B",
213
+ "validator_feedback_bridge.adapter.lora_magnitude_vector",
214
  "validator_feedback_loop",
215
  "validator_feedback_loop.rollback_adapter",
216
  "validator_receipt_bridge",
 
228
  "backbone_frozen": true,
229
  "backbone_present": true,
230
  "hidden_size": 2048,
231
+ "host_parameters": 176621573,
232
+ "host_trainable_parameters": 360448,
233
+ "total_parameters": 34132679301,
234
+ "trainable_parameters": 360448,
235
  "version": "veriloop.coder_peft_host.v1"
236
  },
237
  "version": "veriloop.coder_peft_host.v1"
tokenizer/tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea2e66b594a0906e9a547c9e6ff9e5fb8a8198439c8cf7d6dc48f23529161223
3
  size 19989442
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a0316e38d81a31965b770393461dcc03612ac06e2733f8e1cc440d36a2ef189
3
  size 19989442