gary-neuron / config.json
gary23w's picture
gary-neuron: async NCA + top-2 MoE, 26k params, 99.97% (single-order) / 100% (9-vote) held-out exact-match on 7-digit addition
57f9808 verified
Raw
History Blame Contribute Delete
588 Bytes
{
"model_type": "gary-neuron",
"architecture": "asynchronous Neural Cellular Automaton (1-D strip, 8 cells) with a top-2 Mixture-of-Experts (K=6) per-cell update rule",
"task": "reversed-digit integer addition (Lee et al. 2023 format), up to 7-digit operands",
"S": 8,
"state_dim": 32,
"expert_hidden": 32,
"n_experts": 6,
"topk": 2,
"train_steps": 20,
"p_update": 0.5,
"recommended_inference_steps": 24,
"recommended_vote": 9,
"n_params": 26448,
"trained_step": 8948,
"exact_match_heldout_singleorder": 0.9997,
"exact_match_heldout_vote9": 1.0,
"dependencies": "numpy"
}