File size: 1,741 Bytes
3727dac | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 | {
"adapter_type": "guided_decoding",
"carnot_version": "0.1.0",
"spec": ["REQ-VERIFY-001", "SCENARIO-VERIFY-004"],
"constraint_types": [
"arithmetic",
"type_check",
"return_type",
"return_value_type",
"bound",
"initialization",
"implication",
"exclusion",
"disjunction",
"negation",
"universal",
"nl_consistency"
],
"default_weights": {
"arithmetic": 1.0,
"type_check": 1.0,
"return_type": 1.0,
"return_value_type":1.0,
"bound": 1.0,
"initialization": 0.8,
"implication": 0.9,
"exclusion": 0.9,
"disjunction": 0.7,
"negation": 0.8,
"universal": 0.7,
"nl_consistency": 0.5
},
"default_alpha": 0.5,
"default_check_every_k": 1,
"default_energy_threshold": 0.0,
"default_max_tokens": 256,
"default_temperature": 1.0,
"compatible_model_families": [
"Qwen/Qwen3-0.6B",
"Qwen/Qwen3.5-0.8B",
"Qwen/Qwen2.5-*",
"google/gemma-4-*",
"meta-llama/Llama-*",
"mistralai/Mistral-*"
],
"latency_profile": {
"constraint_check_p50_ms": 0.006,
"constraint_check_p99_ms": 0.034,
"extraction_p50_ms": 0.275,
"per_token_overhead_budget_fraction": 0.0004,
"source_experiments": ["Exp-102", "Exp-110"]
},
"known_limitations": [
"AutoExtractor min-text guard (< 5 chars) skips early tokens",
"No KV-cache: full forward pass every token — use max_tokens < 256 for speed",
"Uniform logit penalty preserves token ranking but does not steer vocabulary selection",
"Energy is a violation count, not a calibrated probability",
"Real-model validation pending (Exp-111); Exp-110 used MockArithmeticLLM"
]
}
|