spikingkiki-v4-adapters / python /lif_metadata.json
clemsail's picture
Add files using upload-large-folder tool
04cd6b7 verified
{
"layers": {
"language_model.model.layers.10.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.10.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.10.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.10.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.10.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.10.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.10.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.10.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.10.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.10.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.10.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.10.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.10.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.11.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.11.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.11.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.11.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.11.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.11.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.11.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.11.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.11.self_attn.k_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.11.self_attn.o_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.11.self_attn.q_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.11.self_attn.v_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.12.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.12.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.12.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.12.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.12.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.12.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.12.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.12.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.12.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.12.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.12.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.12.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.12.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.13.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.13.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.13.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.13.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.13.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.13.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.13.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.13.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.13.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.13.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.13.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.13.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.13.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.14.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.14.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.14.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.14.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.14.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.14.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.14.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.14.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.14.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.14.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.14.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.14.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.14.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.15.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.15.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.15.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.15.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.15.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.15.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.15.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.15.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.15.self_attn.k_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.15.self_attn.o_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.15.self_attn.q_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.15.self_attn.v_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.16.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.16.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.16.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.16.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.16.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.16.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.16.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.16.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.16.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.16.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.16.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.16.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.16.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.17.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.17.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.17.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.17.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.17.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.17.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.17.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.17.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.17.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.17.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.17.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.17.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.17.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.18.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.18.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.18.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.18.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.18.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.18.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.18.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.18.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.18.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.18.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.18.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.18.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.18.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.19.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.19.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.19.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.19.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.19.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.19.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.19.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.19.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.19.self_attn.k_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.19.self_attn.o_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.19.self_attn.q_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.19.self_attn.v_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.20.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.20.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.20.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.20.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.20.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.20.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.20.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.20.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.20.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.20.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.20.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.20.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.20.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.21.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.21.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.21.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.21.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.21.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.21.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.21.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.21.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.21.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.21.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.21.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.21.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.21.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.22.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.22.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.22.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.22.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.22.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.22.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.22.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.22.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.22.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.22.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.22.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.22.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.22.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.23.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.23.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.23.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.23.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.23.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.23.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.23.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.23.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.23.self_attn.k_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.23.self_attn.o_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.23.self_attn.q_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.23.self_attn.v_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.24.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.24.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.24.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.24.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.24.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.24.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.24.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.24.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.24.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.24.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.24.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.24.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.24.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.25.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.25.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.25.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.25.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.25.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.25.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.25.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.25.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.25.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.25.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.25.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.25.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.25.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.26.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.26.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.26.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.26.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.26.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.26.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.26.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.26.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.26.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.26.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.26.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.26.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.26.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.27.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.27.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.27.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.27.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.27.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.27.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.27.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.27.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.27.self_attn.k_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.27.self_attn.o_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.27.self_attn.q_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.27.self_attn.v_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.28.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.28.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.28.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.28.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.28.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.28.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.28.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.28.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.28.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.28.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.28.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.28.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.28.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.29.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.29.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.29.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.29.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.29.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.29.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.29.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.29.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.29.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.29.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.29.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.29.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.29.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.30.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.30.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.30.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.30.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.30.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.30.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.30.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.30.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.30.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.30.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.30.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.30.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.30.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.31.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.31.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.31.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.31.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.31.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.31.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.31.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.31.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.31.self_attn.k_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.31.self_attn.o_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.31.self_attn.q_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.31.self_attn.v_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.32.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.32.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.32.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.32.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.32.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.32.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.32.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.32.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.32.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.32.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.32.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.32.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.32.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.33.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.33.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.33.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.33.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.33.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.33.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.33.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.33.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.33.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.33.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.33.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.33.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.33.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.34.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.34.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.34.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.34.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.34.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.34.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.34.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.34.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.34.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.34.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.34.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.34.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.34.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.35.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.35.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.35.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.35.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.35.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.35.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.35.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.35.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.35.self_attn.k_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.35.self_attn.o_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.35.self_attn.q_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.35.self_attn.v_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.36.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.36.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.36.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.36.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.36.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.36.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.36.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.36.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.36.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.36.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.36.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.36.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.36.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.37.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.37.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.37.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.37.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.37.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.37.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.37.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.37.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.37.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.37.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.37.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.37.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.37.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.38.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.38.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.38.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.38.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.38.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.38.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.38.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.38.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.38.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.38.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.38.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.38.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.38.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.39.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.39.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.39.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.39.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.39.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.39.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.39.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.39.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.39.self_attn.k_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.39.self_attn.o_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.39.self_attn.q_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.39.self_attn.v_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.8.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.8.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.8.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.8.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.8.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.8.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.8.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.8.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.8.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.8.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.8.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.8.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.8.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.9.linear_attn.in_proj_a": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.9.linear_attn.in_proj_b": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.9.linear_attn.in_proj_qkv": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.9.linear_attn.in_proj_z": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.9.linear_attn.out_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.9.mlp.gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.9.mlp.shared_expert.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.9.mlp.shared_expert.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.9.mlp.shared_expert.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.9.mlp.shared_expert_gate": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.9.mlp.switch_mlp.down_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.9.mlp.switch_mlp.gate_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
},
"language_model.model.layers.9.mlp.switch_mlp.up_proj": {
"matched_snn_key": null,
"max_rate": 1.0,
"tau": 1.0,
"threshold": 0.0078125,
"timesteps": 128
}
},
"num_modules": 408,
"snn_base": "/Users/clems/KIKI-Mac_tunner/models/SpikingKiki-35B-A3B-V4",
"source_adapter": "output/micro-kiki/lora-qwen36-35b-v4-sota/python/adapters.safetensors",
"validation_samples": [
{
"abs_max": 0.06933634728193283,
"ann_abs_max": 0.07714884728193283,
"module": "language_model.model.layers.10.linear_attn.in_proj_a",
"rel_l2": 0.9113689466205737
},
{
"abs_max": 0.1121697723865509,
"ann_abs_max": 0.1277947723865509,
"module": "language_model.model.layers.10.linear_attn.in_proj_b",
"rel_l2": 0.8993570745977573
},
{
"abs_max": 0.1508132517337799,
"ann_abs_max": 0.1742507517337799,
"module": "language_model.model.layers.10.linear_attn.in_proj_qkv",
"rel_l2": 0.911129281981103
}
],
"version": "0.1.0"
}