| { |
| "layers": { |
| "language_model.model.layers.10.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.10.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.10.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.10.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.10.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.10.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.10.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.10.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.10.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.10.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.10.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.10.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.10.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.11.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.11.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.11.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.11.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.11.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.11.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.11.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.11.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.11.self_attn.k_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.11.self_attn.o_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.11.self_attn.q_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.11.self_attn.v_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.12.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.12.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.12.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.12.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.12.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.12.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.12.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.12.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.12.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.12.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.12.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.12.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.12.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.13.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.13.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.13.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.13.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.13.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.13.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.13.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.13.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.13.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.13.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.13.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.13.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.13.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.14.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.14.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.14.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.14.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.14.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.14.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.14.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.14.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.14.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.14.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.14.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.14.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.14.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.15.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.15.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.15.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.15.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.15.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.15.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.15.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.15.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.15.self_attn.k_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.15.self_attn.o_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.15.self_attn.q_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.15.self_attn.v_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.16.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.16.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.16.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.16.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.16.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.16.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.16.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.16.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.16.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.16.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.16.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.16.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.16.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.17.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.17.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.17.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.17.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.17.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.17.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.17.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.17.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.17.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.17.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.17.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.17.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.17.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.18.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.18.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.18.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.18.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.18.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.18.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.18.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.18.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.18.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.18.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.18.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.18.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.18.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.19.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.19.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.19.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.19.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.19.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.19.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.19.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.19.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.19.self_attn.k_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.19.self_attn.o_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.19.self_attn.q_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.19.self_attn.v_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.20.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.20.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.20.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.20.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.20.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.20.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.20.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.20.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.20.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.20.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.20.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.20.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.20.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.21.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.21.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.21.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.21.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.21.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.21.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.21.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.21.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.21.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.21.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.21.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.21.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.21.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.22.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.22.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.22.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.22.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.22.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.22.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.22.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.22.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.22.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.22.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.22.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.22.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.22.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.23.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.23.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.23.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.23.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.23.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.23.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.23.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.23.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.23.self_attn.k_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.23.self_attn.o_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.23.self_attn.q_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.23.self_attn.v_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.24.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.24.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.24.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.24.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.24.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.24.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.24.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.24.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.24.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.24.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.24.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.24.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.24.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.25.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.25.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.25.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.25.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.25.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.25.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.25.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.25.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.25.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.25.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.25.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.25.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.25.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.26.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.26.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.26.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.26.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.26.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.26.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.26.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.26.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.26.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.26.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.26.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.26.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.26.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.27.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.27.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.27.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.27.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.27.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.27.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.27.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.27.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.27.self_attn.k_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.27.self_attn.o_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.27.self_attn.q_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.27.self_attn.v_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.28.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.28.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.28.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.28.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.28.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.28.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.28.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.28.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.28.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.28.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.28.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.28.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.28.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.29.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.29.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.29.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.29.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.29.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.29.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.29.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.29.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.29.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.29.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.29.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.29.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.29.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.30.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.30.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.30.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.30.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.30.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.30.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.30.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.30.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.30.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.30.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.30.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.30.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.30.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.31.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.31.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.31.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.31.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.31.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.31.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.31.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.31.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.31.self_attn.k_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.31.self_attn.o_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.31.self_attn.q_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.31.self_attn.v_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.32.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.32.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.32.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.32.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.32.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.32.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.32.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.32.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.32.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.32.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.32.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.32.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.32.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.33.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.33.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.33.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.33.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.33.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.33.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.33.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.33.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.33.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.33.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.33.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.33.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.33.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.34.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.34.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.34.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.34.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.34.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.34.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.34.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.34.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.34.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.34.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.34.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.34.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.34.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.35.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.35.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.35.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.35.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.35.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.35.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.35.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.35.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.35.self_attn.k_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.35.self_attn.o_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.35.self_attn.q_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.35.self_attn.v_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.36.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.36.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.36.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.36.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.36.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.36.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.36.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.36.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.36.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.36.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.36.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.36.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.36.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.37.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.37.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.37.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.37.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.37.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.37.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.37.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.37.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.37.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.37.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.37.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.37.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.37.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.38.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.38.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.38.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.38.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.38.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.38.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.38.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.38.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.38.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.38.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.38.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.38.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.38.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.39.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.39.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.39.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.39.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.39.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.39.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.39.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.39.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.39.self_attn.k_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.39.self_attn.o_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.39.self_attn.q_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.39.self_attn.v_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.8.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.8.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.8.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.8.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.8.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.8.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.8.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.8.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.8.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.8.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.8.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.8.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.8.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.9.linear_attn.in_proj_a": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.9.linear_attn.in_proj_b": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.9.linear_attn.in_proj_qkv": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.9.linear_attn.in_proj_z": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.9.linear_attn.out_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.9.mlp.gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.9.mlp.shared_expert.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.9.mlp.shared_expert.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.9.mlp.shared_expert.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.9.mlp.shared_expert_gate": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.9.mlp.switch_mlp.down_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.9.mlp.switch_mlp.gate_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| }, |
| "language_model.model.layers.9.mlp.switch_mlp.up_proj": { |
| "matched_snn_key": null, |
| "max_rate": 1.0, |
| "tau": 1.0, |
| "threshold": 0.0078125, |
| "timesteps": 128 |
| } |
| }, |
| "num_modules": 408, |
| "snn_base": "/Users/clems/KIKI-Mac_tunner/models/SpikingKiki-35B-A3B-V4", |
| "source_adapter": "output/micro-kiki/lora-qwen36-35b-v4-sota/python/adapters.safetensors", |
| "validation_samples": [ |
| { |
| "abs_max": 0.06933634728193283, |
| "ann_abs_max": 0.07714884728193283, |
| "module": "language_model.model.layers.10.linear_attn.in_proj_a", |
| "rel_l2": 0.9113689466205737 |
| }, |
| { |
| "abs_max": 0.1121697723865509, |
| "ann_abs_max": 0.1277947723865509, |
| "module": "language_model.model.layers.10.linear_attn.in_proj_b", |
| "rel_l2": 0.8993570745977573 |
| }, |
| { |
| "abs_max": 0.1508132517337799, |
| "ann_abs_max": 0.1742507517337799, |
| "module": "language_model.model.layers.10.linear_attn.in_proj_qkv", |
| "rel_l2": 0.911129281981103 |
| } |
| ], |
| "version": "0.1.0" |
| } |
|
|