{
  "model_type": "gary-neuron",
  "architecture": "asynchronous Neural Cellular Automaton (1-D strip, 8 cells) with a top-2 Mixture-of-Experts (K=6) per-cell update rule",
  "task": "reversed-digit integer addition (Lee et al. 2023 format), up to 7-digit operands",
  "S": 8,
  "state_dim": 32,
  "expert_hidden": 32,
  "n_experts": 6,
  "topk": 2,
  "train_steps": 20,
  "p_update": 0.5,
  "recommended_inference_steps": 24,
  "recommended_vote": 9,
  "n_params": 26448,
  "trained_step": 8948,
  "exact_match_heldout_singleorder": 0.9997,
  "exact_match_heldout_vote9": 1.0,
  "dependencies": "numpy"
}