{
  "D": 1024,
  "D_ff": 3072,
  "D_key": 128,
  "D_value": 128,
  "K": 12,
  "N": 8,
  "architectures": [
    "NeuronSparkForCausalLM"
  ],
  "auto_map": {
    "AutoConfig": "configuration_neuronspark.NeuronSparkConfig",
    "AutoModelForCausalLM": "modeling_neuronspark.NeuronSparkForCausalLM"
  },
  "bias_balancing_ema": 0.99,
  "bias_balancing_lr": 0.001,
  "bos_token_id": 1,
  "dtype": "bfloat16",
  "eos_token_id": 2,
  "eps_explore": 0.05,
  "k_predictor_hidden": 256,
  "memory_layer_interval": 4,
  "model_type": "neuronspark",
  "num_hidden_layers": 24,
  "num_layers": 24,
  "ponder_T_final": 0.3,
  "ponder_T_init": 2.0,
  "transformers_version": "5.6.2",
  "use_cache": false,
  "v_th_min": 0.02,
  "vocab_size": 128387
}