{ "architectures": [ "HRMForCausalLM" ], "bos_token_id": 50256, "d_ff": 1536, "d_model": 768, "dropout": 0.0, "dtype": "float32", "eos_token_id": 50256, "episodic_mem_slots": 64, "head_dim": 64, "kv_lora_rank": 192, "layers_per_level": [ 3, 3, 3 ], "max_seq_len": 256, "model_type": "hrm", "moe_d_ff": 512, "mtp_heads": 2, "n_active_experts": 4, "n_experts": 16, "n_heads": 12, "n_levels": 3, "n_shared_experts": 1, "pad_token_id": 0, "q_lora_rank": 256, "rope_head_dim": 32, "semantic_mem_dim": 768, "semantic_mem_size": 512, "tie_embeddings": true, "transformers_version": "5.7.0", "vocab_size": 50257, "working_mem_slots": 16 }