diff --git a/evo-kl-configuration-2.5-v2.txt b/evo-kl-configuration-2.5-v2.txt new file mode 100644 index 0000000000000000000000000000000000000000..e1ae9dd50994b874db3f3d85c6df1c33cf348a4c --- /dev/null +++ b/evo-kl-configuration-2.5-v2.txt @@ -0,0 +1,224 @@ +model.layers.0.mlp.down_proj: 4 +model.layers.0.mlp.gate_proj: 2 +model.layers.0.mlp.up_proj: 3 +model.layers.1.mlp.down_proj: 4 +model.layers.1.mlp.gate_proj: 3 +model.layers.1.mlp.up_proj: 3 +model.layers.2.mlp.down_proj: 3 +model.layers.2.mlp.gate_proj: 2 +model.layers.2.mlp.up_proj: 3 +model.layers.3.mlp.down_proj: 3 +model.layers.3.mlp.gate_proj: 2 +model.layers.3.mlp.up_proj: 3 +model.layers.4.mlp.down_proj: 3 +model.layers.4.mlp.gate_proj: 2 +model.layers.4.mlp.up_proj: 3 +model.layers.5.mlp.down_proj: 3 +model.layers.5.mlp.gate_proj: 2 +model.layers.5.mlp.up_proj: 3 +model.layers.6.mlp.down_proj: 3 +model.layers.6.mlp.gate_proj: 2 +model.layers.6.mlp.up_proj: 3 +model.layers.7.mlp.down_proj: 3 +model.layers.7.mlp.gate_proj: 2 +model.layers.7.mlp.up_proj: 2 +model.layers.8.mlp.down_proj: 3 +model.layers.8.mlp.gate_proj: 2 +model.layers.8.mlp.up_proj: 3 +model.layers.9.mlp.down_proj: 3 +model.layers.9.mlp.gate_proj: 2 +model.layers.9.mlp.up_proj: 3 +model.layers.10.mlp.down_proj: 2 +model.layers.10.mlp.gate_proj: 2 +model.layers.10.mlp.up_proj: 3 +model.layers.11.mlp.down_proj: 2 +model.layers.11.mlp.gate_proj: 2 +model.layers.11.mlp.up_proj: 2 +model.layers.12.mlp.down_proj: 3 +model.layers.12.mlp.gate_proj: 2 +model.layers.12.mlp.up_proj: 2 +model.layers.13.mlp.down_proj: 3 +model.layers.13.mlp.gate_proj: 3 +model.layers.13.mlp.up_proj: 3 +model.layers.14.mlp.down_proj: 3 +model.layers.14.mlp.gate_proj: 2 +model.layers.14.mlp.up_proj: 3 +model.layers.15.mlp.down_proj: 3 +model.layers.15.mlp.gate_proj: 2 +model.layers.15.mlp.up_proj: 3 +model.layers.16.mlp.down_proj: 3 +model.layers.16.mlp.gate_proj: 2 +model.layers.16.mlp.up_proj: 3 +model.layers.17.mlp.down_proj: 3 +model.layers.17.mlp.gate_proj: 2 +model.layers.17.mlp.up_proj: 3 +model.layers.18.mlp.down_proj: 3 +model.layers.18.mlp.gate_proj: 2 +model.layers.18.mlp.up_proj: 3 +model.layers.19.mlp.down_proj: 2 +model.layers.19.mlp.gate_proj: 2 +model.layers.19.mlp.up_proj: 3 +model.layers.20.mlp.down_proj: 2 +model.layers.20.mlp.gate_proj: 2 +model.layers.20.mlp.up_proj: 2 +model.layers.21.mlp.down_proj: 3 +model.layers.21.mlp.gate_proj: 2 +model.layers.21.mlp.up_proj: 2 +model.layers.22.mlp.down_proj: 2 +model.layers.22.mlp.gate_proj: 2 +model.layers.22.mlp.up_proj: 2 +model.layers.23.mlp.down_proj: 2 +model.layers.23.mlp.gate_proj: 2 +model.layers.23.mlp.up_proj: 2 +model.layers.24.mlp.down_proj: 2 +model.layers.24.mlp.gate_proj: 2 +model.layers.24.mlp.up_proj: 3 +model.layers.25.mlp.down_proj: 2 +model.layers.25.mlp.gate_proj: 2 +model.layers.25.mlp.up_proj: 2 +model.layers.26.mlp.down_proj: 2 +model.layers.26.mlp.gate_proj: 2 +model.layers.26.mlp.up_proj: 2 +model.layers.27.mlp.down_proj: 2 +model.layers.27.mlp.gate_proj: 3 +model.layers.27.mlp.up_proj: 2 +model.layers.28.mlp.down_proj: 2 +model.layers.28.mlp.gate_proj: 2 +model.layers.28.mlp.up_proj: 2 +model.layers.29.mlp.down_proj: 2 +model.layers.29.mlp.gate_proj: 2 +model.layers.29.mlp.up_proj: 2 +model.layers.30.mlp.down_proj: 3 +model.layers.30.mlp.gate_proj: 2 +model.layers.30.mlp.up_proj: 2 +model.layers.31.mlp.down_proj: 3 +model.layers.31.mlp.gate_proj: 2 +model.layers.31.mlp.up_proj: 3 +model.layers.0.self_attn.k_proj: 2 +model.layers.0.self_attn.v_proj: 3 +model.layers.1.self_attn.k_proj: 3 +model.layers.1.self_attn.v_proj: 6 +model.layers.2.self_attn.k_proj: 3 +model.layers.2.self_attn.v_proj: 3 +model.layers.3.self_attn.k_proj: 3 +model.layers.3.self_attn.v_proj: 2 +model.layers.4.self_attn.k_proj: 3 +model.layers.4.self_attn.v_proj: 3 +model.layers.5.self_attn.k_proj: 3 +model.layers.5.self_attn.v_proj: 3 +model.layers.6.self_attn.k_proj: 3 +model.layers.6.self_attn.v_proj: 3 +model.layers.7.self_attn.k_proj: 3 +model.layers.7.self_attn.v_proj: 2 +model.layers.8.self_attn.k_proj: 3 +model.layers.8.self_attn.v_proj: 3 +model.layers.9.self_attn.k_proj: 3 +model.layers.9.self_attn.v_proj: 3 +model.layers.10.self_attn.k_proj: 3 +model.layers.10.self_attn.v_proj: 3 +model.layers.11.self_attn.k_proj: 3 +model.layers.11.self_attn.v_proj: 3 +model.layers.12.self_attn.k_proj: 2 +model.layers.12.self_attn.v_proj: 3 +model.layers.13.self_attn.k_proj: 3 +model.layers.13.self_attn.v_proj: 3 +model.layers.14.self_attn.k_proj: 3 +model.layers.14.self_attn.v_proj: 2 +model.layers.15.self_attn.k_proj: 3 +model.layers.15.self_attn.v_proj: 3 +model.layers.16.self_attn.k_proj: 2 +model.layers.16.self_attn.v_proj: 3 +model.layers.17.self_attn.k_proj: 2 +model.layers.17.self_attn.v_proj: 3 +model.layers.18.self_attn.k_proj: 2 +model.layers.18.self_attn.v_proj: 3 +model.layers.19.self_attn.k_proj: 2 +model.layers.19.self_attn.v_proj: 2 +model.layers.20.self_attn.k_proj: 2 +model.layers.20.self_attn.v_proj: 2 +model.layers.21.self_attn.k_proj: 2 +model.layers.21.self_attn.v_proj: 3 +model.layers.22.self_attn.k_proj: 2 +model.layers.22.self_attn.v_proj: 2 +model.layers.23.self_attn.k_proj: 2 +model.layers.23.self_attn.v_proj: 2 +model.layers.24.self_attn.k_proj: 2 +model.layers.24.self_attn.v_proj: 2 +model.layers.25.self_attn.k_proj: 2 +model.layers.25.self_attn.v_proj: 2 +model.layers.26.self_attn.k_proj: 2 +model.layers.26.self_attn.v_proj: 2 +model.layers.27.self_attn.k_proj: 2 +model.layers.27.self_attn.v_proj: 2 +model.layers.28.self_attn.k_proj: 2 +model.layers.28.self_attn.v_proj: 2 +model.layers.29.self_attn.k_proj: 2 +model.layers.29.self_attn.v_proj: 2 +model.layers.30.self_attn.k_proj: 2 +model.layers.30.self_attn.v_proj: 2 +model.layers.31.self_attn.k_proj: 3 +model.layers.31.self_attn.v_proj: 3 +model.layers.0.self_attn.o_proj: 3 +model.layers.0.self_attn.q_proj: 2 +model.layers.1.self_attn.o_proj: 3 +model.layers.1.self_attn.q_proj: 2 +model.layers.2.self_attn.o_proj: 3 +model.layers.2.self_attn.q_proj: 3 +model.layers.3.self_attn.o_proj: 3 +model.layers.3.self_attn.q_proj: 4 +model.layers.4.self_attn.o_proj: 4 +model.layers.4.self_attn.q_proj: 3 +model.layers.5.self_attn.o_proj: 3 +model.layers.5.self_attn.q_proj: 3 +model.layers.6.self_attn.o_proj: 3 +model.layers.6.self_attn.q_proj: 3 +model.layers.7.self_attn.o_proj: 3 +model.layers.7.self_attn.q_proj: 3 +model.layers.8.self_attn.o_proj: 3 +model.layers.8.self_attn.q_proj: 3 +model.layers.9.self_attn.o_proj: 4 +model.layers.9.self_attn.q_proj: 3 +model.layers.10.self_attn.o_proj: 3 +model.layers.10.self_attn.q_proj: 3 +model.layers.11.self_attn.o_proj: 3 +model.layers.11.self_attn.q_proj: 3 +model.layers.12.self_attn.o_proj: 3 +model.layers.12.self_attn.q_proj: 2 +model.layers.13.self_attn.o_proj: 3 +model.layers.13.self_attn.q_proj: 2 +model.layers.14.self_attn.o_proj: 3 +model.layers.14.self_attn.q_proj: 3 +model.layers.15.self_attn.o_proj: 3 +model.layers.15.self_attn.q_proj: 3 +model.layers.16.self_attn.o_proj: 3 +model.layers.16.self_attn.q_proj: 3 +model.layers.17.self_attn.o_proj: 3 +model.layers.17.self_attn.q_proj: 2 +model.layers.18.self_attn.o_proj: 2 +model.layers.18.self_attn.q_proj: 2 +model.layers.19.self_attn.o_proj: 2 +model.layers.19.self_attn.q_proj: 3 +model.layers.20.self_attn.o_proj: 2 +model.layers.20.self_attn.q_proj: 2 +model.layers.21.self_attn.o_proj: 3 +model.layers.21.self_attn.q_proj: 2 +model.layers.22.self_attn.o_proj: 3 +model.layers.22.self_attn.q_proj: 2 +model.layers.23.self_attn.o_proj: 2 +model.layers.23.self_attn.q_proj: 2 +model.layers.24.self_attn.o_proj: 2 +model.layers.24.self_attn.q_proj: 2 +model.layers.25.self_attn.o_proj: 2 +model.layers.25.self_attn.q_proj: 2 +model.layers.26.self_attn.o_proj: 2 +model.layers.26.self_attn.q_proj: 2 +model.layers.27.self_attn.o_proj: 3 +model.layers.27.self_attn.q_proj: 2 +model.layers.28.self_attn.o_proj: 2 +model.layers.28.self_attn.q_proj: 2 +model.layers.29.self_attn.o_proj: 2 +model.layers.29.self_attn.q_proj: 3 +model.layers.30.self_attn.o_proj: 3 +model.layers.30.self_attn.q_proj: 2 +model.layers.31.self_attn.o_proj: 3 +model.layers.31.self_attn.q_proj: 2 \ No newline at end of file diff --git a/evo-kl-configuration-2.75-v2.txt b/evo-kl-configuration-2.75-v2.txt new file mode 100644 index 0000000000000000000000000000000000000000..1aff1685ce1bffa16acdf2f58bcac0d62a2bf0a4 --- /dev/null +++ b/evo-kl-configuration-2.75-v2.txt @@ -0,0 +1,224 @@ +model.layers.0.mlp.down_proj: 3 +model.layers.0.mlp.gate_proj: 3 +model.layers.0.mlp.up_proj: 3 +model.layers.1.mlp.down_proj: 4 +model.layers.1.mlp.gate_proj: 2 +model.layers.1.mlp.up_proj: 3 +model.layers.2.mlp.down_proj: 3 +model.layers.2.mlp.gate_proj: 2 +model.layers.2.mlp.up_proj: 3 +model.layers.3.mlp.down_proj: 3 +model.layers.3.mlp.gate_proj: 2 +model.layers.3.mlp.up_proj: 3 +model.layers.4.mlp.down_proj: 3 +model.layers.4.mlp.gate_proj: 3 +model.layers.4.mlp.up_proj: 3 +model.layers.5.mlp.down_proj: 3 +model.layers.5.mlp.gate_proj: 2 +model.layers.5.mlp.up_proj: 3 +model.layers.6.mlp.down_proj: 3 +model.layers.6.mlp.gate_proj: 2 +model.layers.6.mlp.up_proj: 3 +model.layers.7.mlp.down_proj: 3 +model.layers.7.mlp.gate_proj: 3 +model.layers.7.mlp.up_proj: 3 +model.layers.8.mlp.down_proj: 3 +model.layers.8.mlp.gate_proj: 3 +model.layers.8.mlp.up_proj: 3 +model.layers.9.mlp.down_proj: 3 +model.layers.9.mlp.gate_proj: 2 +model.layers.9.mlp.up_proj: 3 +model.layers.10.mlp.down_proj: 3 +model.layers.10.mlp.gate_proj: 2 +model.layers.10.mlp.up_proj: 3 +model.layers.11.mlp.down_proj: 3 +model.layers.11.mlp.gate_proj: 2 +model.layers.11.mlp.up_proj: 3 +model.layers.12.mlp.down_proj: 3 +model.layers.12.mlp.gate_proj: 3 +model.layers.12.mlp.up_proj: 3 +model.layers.13.mlp.down_proj: 3 +model.layers.13.mlp.gate_proj: 2 +model.layers.13.mlp.up_proj: 3 +model.layers.14.mlp.down_proj: 3 +model.layers.14.mlp.gate_proj: 3 +model.layers.14.mlp.up_proj: 3 +model.layers.15.mlp.down_proj: 3 +model.layers.15.mlp.gate_proj: 2 +model.layers.15.mlp.up_proj: 3 +model.layers.16.mlp.down_proj: 3 +model.layers.16.mlp.gate_proj: 2 +model.layers.16.mlp.up_proj: 3 +model.layers.17.mlp.down_proj: 3 +model.layers.17.mlp.gate_proj: 2 +model.layers.17.mlp.up_proj: 3 +model.layers.18.mlp.down_proj: 3 +model.layers.18.mlp.gate_proj: 2 +model.layers.18.mlp.up_proj: 3 +model.layers.19.mlp.down_proj: 3 +model.layers.19.mlp.gate_proj: 2 +model.layers.19.mlp.up_proj: 3 +model.layers.20.mlp.down_proj: 3 +model.layers.20.mlp.gate_proj: 2 +model.layers.20.mlp.up_proj: 3 +model.layers.21.mlp.down_proj: 3 +model.layers.21.mlp.gate_proj: 3 +model.layers.21.mlp.up_proj: 3 +model.layers.22.mlp.down_proj: 3 +model.layers.22.mlp.gate_proj: 2 +model.layers.22.mlp.up_proj: 3 +model.layers.23.mlp.down_proj: 3 +model.layers.23.mlp.gate_proj: 2 +model.layers.23.mlp.up_proj: 3 +model.layers.24.mlp.down_proj: 2 +model.layers.24.mlp.gate_proj: 2 +model.layers.24.mlp.up_proj: 3 +model.layers.25.mlp.down_proj: 3 +model.layers.25.mlp.gate_proj: 2 +model.layers.25.mlp.up_proj: 3 +model.layers.26.mlp.down_proj: 2 +model.layers.26.mlp.gate_proj: 2 +model.layers.26.mlp.up_proj: 2 +model.layers.27.mlp.down_proj: 3 +model.layers.27.mlp.gate_proj: 3 +model.layers.27.mlp.up_proj: 3 +model.layers.28.mlp.down_proj: 3 +model.layers.28.mlp.gate_proj: 2 +model.layers.28.mlp.up_proj: 2 +model.layers.29.mlp.down_proj: 3 +model.layers.29.mlp.gate_proj: 2 +model.layers.29.mlp.up_proj: 2 +model.layers.30.mlp.down_proj: 3 +model.layers.30.mlp.gate_proj: 3 +model.layers.30.mlp.up_proj: 3 +model.layers.31.mlp.down_proj: 3 +model.layers.31.mlp.gate_proj: 2 +model.layers.31.mlp.up_proj: 3 +model.layers.0.self_attn.k_proj: 3 +model.layers.0.self_attn.v_proj: 3 +model.layers.1.self_attn.k_proj: 3 +model.layers.1.self_attn.v_proj: 6 +model.layers.2.self_attn.k_proj: 3 +model.layers.2.self_attn.v_proj: 3 +model.layers.3.self_attn.k_proj: 3 +model.layers.3.self_attn.v_proj: 3 +model.layers.4.self_attn.k_proj: 3 +model.layers.4.self_attn.v_proj: 4 +model.layers.5.self_attn.k_proj: 3 +model.layers.5.self_attn.v_proj: 4 +model.layers.6.self_attn.k_proj: 3 +model.layers.6.self_attn.v_proj: 3 +model.layers.7.self_attn.k_proj: 3 +model.layers.7.self_attn.v_proj: 2 +model.layers.8.self_attn.k_proj: 3 +model.layers.8.self_attn.v_proj: 3 +model.layers.9.self_attn.k_proj: 3 +model.layers.9.self_attn.v_proj: 3 +model.layers.10.self_attn.k_proj: 3 +model.layers.10.self_attn.v_proj: 4 +model.layers.11.self_attn.k_proj: 3 +model.layers.11.self_attn.v_proj: 3 +model.layers.12.self_attn.k_proj: 3 +model.layers.12.self_attn.v_proj: 3 +model.layers.13.self_attn.k_proj: 3 +model.layers.13.self_attn.v_proj: 3 +model.layers.14.self_attn.k_proj: 3 +model.layers.14.self_attn.v_proj: 3 +model.layers.15.self_attn.k_proj: 3 +model.layers.15.self_attn.v_proj: 3 +model.layers.16.self_attn.k_proj: 2 +model.layers.16.self_attn.v_proj: 3 +model.layers.17.self_attn.k_proj: 2 +model.layers.17.self_attn.v_proj: 3 +model.layers.18.self_attn.k_proj: 3 +model.layers.18.self_attn.v_proj: 2 +model.layers.19.self_attn.k_proj: 3 +model.layers.19.self_attn.v_proj: 2 +model.layers.20.self_attn.k_proj: 2 +model.layers.20.self_attn.v_proj: 3 +model.layers.21.self_attn.k_proj: 2 +model.layers.21.self_attn.v_proj: 3 +model.layers.22.self_attn.k_proj: 2 +model.layers.22.self_attn.v_proj: 2 +model.layers.23.self_attn.k_proj: 2 +model.layers.23.self_attn.v_proj: 2 +model.layers.24.self_attn.k_proj: 2 +model.layers.24.self_attn.v_proj: 2 +model.layers.25.self_attn.k_proj: 2 +model.layers.25.self_attn.v_proj: 2 +model.layers.26.self_attn.k_proj: 2 +model.layers.26.self_attn.v_proj: 3 +model.layers.27.self_attn.k_proj: 3 +model.layers.27.self_attn.v_proj: 3 +model.layers.28.self_attn.k_proj: 3 +model.layers.28.self_attn.v_proj: 3 +model.layers.29.self_attn.k_proj: 3 +model.layers.29.self_attn.v_proj: 2 +model.layers.30.self_attn.k_proj: 3 +model.layers.30.self_attn.v_proj: 3 +model.layers.31.self_attn.k_proj: 3 +model.layers.31.self_attn.v_proj: 3 +model.layers.0.self_attn.o_proj: 3 +model.layers.0.self_attn.q_proj: 2 +model.layers.1.self_attn.o_proj: 4 +model.layers.1.self_attn.q_proj: 2 +model.layers.2.self_attn.o_proj: 3 +model.layers.2.self_attn.q_proj: 3 +model.layers.3.self_attn.o_proj: 3 +model.layers.3.self_attn.q_proj: 3 +model.layers.4.self_attn.o_proj: 3 +model.layers.4.self_attn.q_proj: 3 +model.layers.5.self_attn.o_proj: 3 +model.layers.5.self_attn.q_proj: 4 +model.layers.6.self_attn.o_proj: 3 +model.layers.6.self_attn.q_proj: 3 +model.layers.7.self_attn.o_proj: 3 +model.layers.7.self_attn.q_proj: 3 +model.layers.8.self_attn.o_proj: 4 +model.layers.8.self_attn.q_proj: 3 +model.layers.9.self_attn.o_proj: 3 +model.layers.9.self_attn.q_proj: 3 +model.layers.10.self_attn.o_proj: 3 +model.layers.10.self_attn.q_proj: 3 +model.layers.11.self_attn.o_proj: 3 +model.layers.11.self_attn.q_proj: 4 +model.layers.12.self_attn.o_proj: 3 +model.layers.12.self_attn.q_proj: 3 +model.layers.13.self_attn.o_proj: 3 +model.layers.13.self_attn.q_proj: 3 +model.layers.14.self_attn.o_proj: 3 +model.layers.14.self_attn.q_proj: 3 +model.layers.15.self_attn.o_proj: 4 +model.layers.15.self_attn.q_proj: 3 +model.layers.16.self_attn.o_proj: 4 +model.layers.16.self_attn.q_proj: 3 +model.layers.17.self_attn.o_proj: 3 +model.layers.17.self_attn.q_proj: 2 +model.layers.18.self_attn.o_proj: 3 +model.layers.18.self_attn.q_proj: 2 +model.layers.19.self_attn.o_proj: 2 +model.layers.19.self_attn.q_proj: 3 +model.layers.20.self_attn.o_proj: 3 +model.layers.20.self_attn.q_proj: 3 +model.layers.21.self_attn.o_proj: 3 +model.layers.21.self_attn.q_proj: 3 +model.layers.22.self_attn.o_proj: 2 +model.layers.22.self_attn.q_proj: 3 +model.layers.23.self_attn.o_proj: 2 +model.layers.23.self_attn.q_proj: 3 +model.layers.24.self_attn.o_proj: 2 +model.layers.24.self_attn.q_proj: 2 +model.layers.25.self_attn.o_proj: 3 +model.layers.25.self_attn.q_proj: 3 +model.layers.26.self_attn.o_proj: 2 +model.layers.26.self_attn.q_proj: 2 +model.layers.27.self_attn.o_proj: 2 +model.layers.27.self_attn.q_proj: 2 +model.layers.28.self_attn.o_proj: 3 +model.layers.28.self_attn.q_proj: 2 +model.layers.29.self_attn.o_proj: 2 +model.layers.29.self_attn.q_proj: 3 +model.layers.30.self_attn.o_proj: 3 +model.layers.30.self_attn.q_proj: 2 +model.layers.31.self_attn.o_proj: 3 +model.layers.31.self_attn.q_proj: 2 \ No newline at end of file diff --git a/evo-kl-configuration-3.0-v2.txt b/evo-kl-configuration-3.0-v2.txt new file mode 100644 index 0000000000000000000000000000000000000000..fe69443aa5459c48ebe6b0da40b780a781464e50 --- /dev/null +++ b/evo-kl-configuration-3.0-v2.txt @@ -0,0 +1,224 @@ +model.layers.0.mlp.down_proj: 4 +model.layers.0.mlp.gate_proj: 3 +model.layers.0.mlp.up_proj: 3 +model.layers.1.mlp.down_proj: 4 +model.layers.1.mlp.gate_proj: 3 +model.layers.1.mlp.up_proj: 3 +model.layers.2.mlp.down_proj: 3 +model.layers.2.mlp.gate_proj: 3 +model.layers.2.mlp.up_proj: 3 +model.layers.3.mlp.down_proj: 4 +model.layers.3.mlp.gate_proj: 3 +model.layers.3.mlp.up_proj: 3 +model.layers.4.mlp.down_proj: 3 +model.layers.4.mlp.gate_proj: 3 +model.layers.4.mlp.up_proj: 4 +model.layers.5.mlp.down_proj: 3 +model.layers.5.mlp.gate_proj: 2 +model.layers.5.mlp.up_proj: 3 +model.layers.6.mlp.down_proj: 3 +model.layers.6.mlp.gate_proj: 3 +model.layers.6.mlp.up_proj: 3 +model.layers.7.mlp.down_proj: 3 +model.layers.7.mlp.gate_proj: 3 +model.layers.7.mlp.up_proj: 3 +model.layers.8.mlp.down_proj: 3 +model.layers.8.mlp.gate_proj: 3 +model.layers.8.mlp.up_proj: 3 +model.layers.9.mlp.down_proj: 3 +model.layers.9.mlp.gate_proj: 3 +model.layers.9.mlp.up_proj: 3 +model.layers.10.mlp.down_proj: 3 +model.layers.10.mlp.gate_proj: 3 +model.layers.10.mlp.up_proj: 3 +model.layers.11.mlp.down_proj: 3 +model.layers.11.mlp.gate_proj: 3 +model.layers.11.mlp.up_proj: 3 +model.layers.12.mlp.down_proj: 3 +model.layers.12.mlp.gate_proj: 3 +model.layers.12.mlp.up_proj: 3 +model.layers.13.mlp.down_proj: 3 +model.layers.13.mlp.gate_proj: 3 +model.layers.13.mlp.up_proj: 3 +model.layers.14.mlp.down_proj: 3 +model.layers.14.mlp.gate_proj: 3 +model.layers.14.mlp.up_proj: 3 +model.layers.15.mlp.down_proj: 3 +model.layers.15.mlp.gate_proj: 3 +model.layers.15.mlp.up_proj: 3 +model.layers.16.mlp.down_proj: 3 +model.layers.16.mlp.gate_proj: 2 +model.layers.16.mlp.up_proj: 3 +model.layers.17.mlp.down_proj: 3 +model.layers.17.mlp.gate_proj: 3 +model.layers.17.mlp.up_proj: 3 +model.layers.18.mlp.down_proj: 3 +model.layers.18.mlp.gate_proj: 2 +model.layers.18.mlp.up_proj: 3 +model.layers.19.mlp.down_proj: 3 +model.layers.19.mlp.gate_proj: 3 +model.layers.19.mlp.up_proj: 3 +model.layers.20.mlp.down_proj: 3 +model.layers.20.mlp.gate_proj: 3 +model.layers.20.mlp.up_proj: 3 +model.layers.21.mlp.down_proj: 3 +model.layers.21.mlp.gate_proj: 3 +model.layers.21.mlp.up_proj: 3 +model.layers.22.mlp.down_proj: 2 +model.layers.22.mlp.gate_proj: 3 +model.layers.22.mlp.up_proj: 3 +model.layers.23.mlp.down_proj: 3 +model.layers.23.mlp.gate_proj: 3 +model.layers.23.mlp.up_proj: 3 +model.layers.24.mlp.down_proj: 3 +model.layers.24.mlp.gate_proj: 2 +model.layers.24.mlp.up_proj: 3 +model.layers.25.mlp.down_proj: 3 +model.layers.25.mlp.gate_proj: 3 +model.layers.25.mlp.up_proj: 3 +model.layers.26.mlp.down_proj: 3 +model.layers.26.mlp.gate_proj: 2 +model.layers.26.mlp.up_proj: 3 +model.layers.27.mlp.down_proj: 3 +model.layers.27.mlp.gate_proj: 3 +model.layers.27.mlp.up_proj: 3 +model.layers.28.mlp.down_proj: 3 +model.layers.28.mlp.gate_proj: 3 +model.layers.28.mlp.up_proj: 3 +model.layers.29.mlp.down_proj: 3 +model.layers.29.mlp.gate_proj: 3 +model.layers.29.mlp.up_proj: 3 +model.layers.30.mlp.down_proj: 3 +model.layers.30.mlp.gate_proj: 3 +model.layers.30.mlp.up_proj: 3 +model.layers.31.mlp.down_proj: 4 +model.layers.31.mlp.gate_proj: 3 +model.layers.31.mlp.up_proj: 3 +model.layers.0.self_attn.k_proj: 3 +model.layers.0.self_attn.v_proj: 3 +model.layers.1.self_attn.k_proj: 3 +model.layers.1.self_attn.v_proj: 6 +model.layers.2.self_attn.k_proj: 3 +model.layers.2.self_attn.v_proj: 3 +model.layers.3.self_attn.k_proj: 4 +model.layers.3.self_attn.v_proj: 3 +model.layers.4.self_attn.k_proj: 3 +model.layers.4.self_attn.v_proj: 4 +model.layers.5.self_attn.k_proj: 3 +model.layers.5.self_attn.v_proj: 3 +model.layers.6.self_attn.k_proj: 3 +model.layers.6.self_attn.v_proj: 3 +model.layers.7.self_attn.k_proj: 3 +model.layers.7.self_attn.v_proj: 4 +model.layers.8.self_attn.k_proj: 3 +model.layers.8.self_attn.v_proj: 4 +model.layers.9.self_attn.k_proj: 4 +model.layers.9.self_attn.v_proj: 3 +model.layers.10.self_attn.k_proj: 3 +model.layers.10.self_attn.v_proj: 3 +model.layers.11.self_attn.k_proj: 4 +model.layers.11.self_attn.v_proj: 4 +model.layers.12.self_attn.k_proj: 3 +model.layers.12.self_attn.v_proj: 3 +model.layers.13.self_attn.k_proj: 3 +model.layers.13.self_attn.v_proj: 3 +model.layers.14.self_attn.k_proj: 3 +model.layers.14.self_attn.v_proj: 3 +model.layers.15.self_attn.k_proj: 3 +model.layers.15.self_attn.v_proj: 3 +model.layers.16.self_attn.k_proj: 3 +model.layers.16.self_attn.v_proj: 4 +model.layers.17.self_attn.k_proj: 3 +model.layers.17.self_attn.v_proj: 3 +model.layers.18.self_attn.k_proj: 2 +model.layers.18.self_attn.v_proj: 3 +model.layers.19.self_attn.k_proj: 3 +model.layers.19.self_attn.v_proj: 3 +model.layers.20.self_attn.k_proj: 2 +model.layers.20.self_attn.v_proj: 3 +model.layers.21.self_attn.k_proj: 2 +model.layers.21.self_attn.v_proj: 3 +model.layers.22.self_attn.k_proj: 3 +model.layers.22.self_attn.v_proj: 2 +model.layers.23.self_attn.k_proj: 3 +model.layers.23.self_attn.v_proj: 2 +model.layers.24.self_attn.k_proj: 3 +model.layers.24.self_attn.v_proj: 2 +model.layers.25.self_attn.k_proj: 3 +model.layers.25.self_attn.v_proj: 2 +model.layers.26.self_attn.k_proj: 2 +model.layers.26.self_attn.v_proj: 2 +model.layers.27.self_attn.k_proj: 2 +model.layers.27.self_attn.v_proj: 3 +model.layers.28.self_attn.k_proj: 3 +model.layers.28.self_attn.v_proj: 4 +model.layers.29.self_attn.k_proj: 2 +model.layers.29.self_attn.v_proj: 3 +model.layers.30.self_attn.k_proj: 3 +model.layers.30.self_attn.v_proj: 3 +model.layers.31.self_attn.k_proj: 3 +model.layers.31.self_attn.v_proj: 3 +model.layers.0.self_attn.o_proj: 3 +model.layers.0.self_attn.q_proj: 2 +model.layers.1.self_attn.o_proj: 4 +model.layers.1.self_attn.q_proj: 4 +model.layers.2.self_attn.o_proj: 3 +model.layers.2.self_attn.q_proj: 3 +model.layers.3.self_attn.o_proj: 3 +model.layers.3.self_attn.q_proj: 3 +model.layers.4.self_attn.o_proj: 3 +model.layers.4.self_attn.q_proj: 3 +model.layers.5.self_attn.o_proj: 3 +model.layers.5.self_attn.q_proj: 4 +model.layers.6.self_attn.o_proj: 3 +model.layers.6.self_attn.q_proj: 3 +model.layers.7.self_attn.o_proj: 3 +model.layers.7.self_attn.q_proj: 4 +model.layers.8.self_attn.o_proj: 4 +model.layers.8.self_attn.q_proj: 3 +model.layers.9.self_attn.o_proj: 4 +model.layers.9.self_attn.q_proj: 3 +model.layers.10.self_attn.o_proj: 3 +model.layers.10.self_attn.q_proj: 3 +model.layers.11.self_attn.o_proj: 3 +model.layers.11.self_attn.q_proj: 3 +model.layers.12.self_attn.o_proj: 3 +model.layers.12.self_attn.q_proj: 4 +model.layers.13.self_attn.o_proj: 4 +model.layers.13.self_attn.q_proj: 3 +model.layers.14.self_attn.o_proj: 4 +model.layers.14.self_attn.q_proj: 3 +model.layers.15.self_attn.o_proj: 3 +model.layers.15.self_attn.q_proj: 3 +model.layers.16.self_attn.o_proj: 3 +model.layers.16.self_attn.q_proj: 3 +model.layers.17.self_attn.o_proj: 3 +model.layers.17.self_attn.q_proj: 3 +model.layers.18.self_attn.o_proj: 3 +model.layers.18.self_attn.q_proj: 3 +model.layers.19.self_attn.o_proj: 3 +model.layers.19.self_attn.q_proj: 3 +model.layers.20.self_attn.o_proj: 3 +model.layers.20.self_attn.q_proj: 3 +model.layers.21.self_attn.o_proj: 3 +model.layers.21.self_attn.q_proj: 3 +model.layers.22.self_attn.o_proj: 3 +model.layers.22.self_attn.q_proj: 2 +model.layers.23.self_attn.o_proj: 3 +model.layers.23.self_attn.q_proj: 2 +model.layers.24.self_attn.o_proj: 2 +model.layers.24.self_attn.q_proj: 2 +model.layers.25.self_attn.o_proj: 2 +model.layers.25.self_attn.q_proj: 3 +model.layers.26.self_attn.o_proj: 2 +model.layers.26.self_attn.q_proj: 3 +model.layers.27.self_attn.o_proj: 3 +model.layers.27.self_attn.q_proj: 2 +model.layers.28.self_attn.o_proj: 3 +model.layers.28.self_attn.q_proj: 2 +model.layers.29.self_attn.o_proj: 3 +model.layers.29.self_attn.q_proj: 3 +model.layers.30.self_attn.o_proj: 3 +model.layers.30.self_attn.q_proj: 3 +model.layers.31.self_attn.o_proj: 3 +model.layers.31.self_attn.q_proj: 3 \ No newline at end of file diff --git a/evo-kl-configuration-3.25-v2.txt b/evo-kl-configuration-3.25-v2.txt new file mode 100644 index 0000000000000000000000000000000000000000..4c9a1a2997c366b0ac2f31c47f22d7a26484f40f --- /dev/null +++ b/evo-kl-configuration-3.25-v2.txt @@ -0,0 +1,224 @@ +model.layers.0.mlp.down_proj: 4 +model.layers.0.mlp.gate_proj: 3 +model.layers.0.mlp.up_proj: 3 +model.layers.1.mlp.down_proj: 4 +model.layers.1.mlp.gate_proj: 3 +model.layers.1.mlp.up_proj: 3 +model.layers.2.mlp.down_proj: 3 +model.layers.2.mlp.gate_proj: 3 +model.layers.2.mlp.up_proj: 3 +model.layers.3.mlp.down_proj: 3 +model.layers.3.mlp.gate_proj: 3 +model.layers.3.mlp.up_proj: 4 +model.layers.4.mlp.down_proj: 3 +model.layers.4.mlp.gate_proj: 3 +model.layers.4.mlp.up_proj: 4 +model.layers.5.mlp.down_proj: 3 +model.layers.5.mlp.gate_proj: 3 +model.layers.5.mlp.up_proj: 4 +model.layers.6.mlp.down_proj: 3 +model.layers.6.mlp.gate_proj: 2 +model.layers.6.mlp.up_proj: 3 +model.layers.7.mlp.down_proj: 4 +model.layers.7.mlp.gate_proj: 3 +model.layers.7.mlp.up_proj: 3 +model.layers.8.mlp.down_proj: 4 +model.layers.8.mlp.gate_proj: 3 +model.layers.8.mlp.up_proj: 3 +model.layers.9.mlp.down_proj: 3 +model.layers.9.mlp.gate_proj: 3 +model.layers.9.mlp.up_proj: 3 +model.layers.10.mlp.down_proj: 3 +model.layers.10.mlp.gate_proj: 3 +model.layers.10.mlp.up_proj: 3 +model.layers.11.mlp.down_proj: 3 +model.layers.11.mlp.gate_proj: 3 +model.layers.11.mlp.up_proj: 3 +model.layers.12.mlp.down_proj: 3 +model.layers.12.mlp.gate_proj: 3 +model.layers.12.mlp.up_proj: 3 +model.layers.13.mlp.down_proj: 3 +model.layers.13.mlp.gate_proj: 3 +model.layers.13.mlp.up_proj: 4 +model.layers.14.mlp.down_proj: 3 +model.layers.14.mlp.gate_proj: 3 +model.layers.14.mlp.up_proj: 3 +model.layers.15.mlp.down_proj: 3 +model.layers.15.mlp.gate_proj: 3 +model.layers.15.mlp.up_proj: 3 +model.layers.16.mlp.down_proj: 4 +model.layers.16.mlp.gate_proj: 3 +model.layers.16.mlp.up_proj: 3 +model.layers.17.mlp.down_proj: 4 +model.layers.17.mlp.gate_proj: 3 +model.layers.17.mlp.up_proj: 3 +model.layers.18.mlp.down_proj: 4 +model.layers.18.mlp.gate_proj: 3 +model.layers.18.mlp.up_proj: 3 +model.layers.19.mlp.down_proj: 3 +model.layers.19.mlp.gate_proj: 3 +model.layers.19.mlp.up_proj: 3 +model.layers.20.mlp.down_proj: 3 +model.layers.20.mlp.gate_proj: 3 +model.layers.20.mlp.up_proj: 3 +model.layers.21.mlp.down_proj: 3 +model.layers.21.mlp.gate_proj: 3 +model.layers.21.mlp.up_proj: 4 +model.layers.22.mlp.down_proj: 4 +model.layers.22.mlp.gate_proj: 3 +model.layers.22.mlp.up_proj: 3 +model.layers.23.mlp.down_proj: 3 +model.layers.23.mlp.gate_proj: 3 +model.layers.23.mlp.up_proj: 3 +model.layers.24.mlp.down_proj: 3 +model.layers.24.mlp.gate_proj: 3 +model.layers.24.mlp.up_proj: 3 +model.layers.25.mlp.down_proj: 3 +model.layers.25.mlp.gate_proj: 3 +model.layers.25.mlp.up_proj: 3 +model.layers.26.mlp.down_proj: 3 +model.layers.26.mlp.gate_proj: 3 +model.layers.26.mlp.up_proj: 3 +model.layers.27.mlp.down_proj: 3 +model.layers.27.mlp.gate_proj: 3 +model.layers.27.mlp.up_proj: 3 +model.layers.28.mlp.down_proj: 3 +model.layers.28.mlp.gate_proj: 3 +model.layers.28.mlp.up_proj: 3 +model.layers.29.mlp.down_proj: 3 +model.layers.29.mlp.gate_proj: 3 +model.layers.29.mlp.up_proj: 3 +model.layers.30.mlp.down_proj: 4 +model.layers.30.mlp.gate_proj: 3 +model.layers.30.mlp.up_proj: 4 +model.layers.31.mlp.down_proj: 4 +model.layers.31.mlp.gate_proj: 4 +model.layers.31.mlp.up_proj: 6 +model.layers.0.self_attn.k_proj: 3 +model.layers.0.self_attn.v_proj: 4 +model.layers.1.self_attn.k_proj: 3 +model.layers.1.self_attn.v_proj: 8 +model.layers.2.self_attn.k_proj: 3 +model.layers.2.self_attn.v_proj: 4 +model.layers.3.self_attn.k_proj: 3 +model.layers.3.self_attn.v_proj: 6 +model.layers.4.self_attn.k_proj: 3 +model.layers.4.self_attn.v_proj: 4 +model.layers.5.self_attn.k_proj: 4 +model.layers.5.self_attn.v_proj: 3 +model.layers.6.self_attn.k_proj: 3 +model.layers.6.self_attn.v_proj: 3 +model.layers.7.self_attn.k_proj: 3 +model.layers.7.self_attn.v_proj: 4 +model.layers.8.self_attn.k_proj: 4 +model.layers.8.self_attn.v_proj: 4 +model.layers.9.self_attn.k_proj: 6 +model.layers.9.self_attn.v_proj: 3 +model.layers.10.self_attn.k_proj: 4 +model.layers.10.self_attn.v_proj: 3 +model.layers.11.self_attn.k_proj: 4 +model.layers.11.self_attn.v_proj: 3 +model.layers.12.self_attn.k_proj: 4 +model.layers.12.self_attn.v_proj: 3 +model.layers.13.self_attn.k_proj: 4 +model.layers.13.self_attn.v_proj: 3 +model.layers.14.self_attn.k_proj: 3 +model.layers.14.self_attn.v_proj: 3 +model.layers.15.self_attn.k_proj: 4 +model.layers.15.self_attn.v_proj: 6 +model.layers.16.self_attn.k_proj: 4 +model.layers.16.self_attn.v_proj: 3 +model.layers.17.self_attn.k_proj: 3 +model.layers.17.self_attn.v_proj: 3 +model.layers.18.self_attn.k_proj: 3 +model.layers.18.self_attn.v_proj: 4 +model.layers.19.self_attn.k_proj: 4 +model.layers.19.self_attn.v_proj: 3 +model.layers.20.self_attn.k_proj: 3 +model.layers.20.self_attn.v_proj: 3 +model.layers.21.self_attn.k_proj: 3 +model.layers.21.self_attn.v_proj: 3 +model.layers.22.self_attn.k_proj: 4 +model.layers.22.self_attn.v_proj: 3 +model.layers.23.self_attn.k_proj: 3 +model.layers.23.self_attn.v_proj: 2 +model.layers.24.self_attn.k_proj: 3 +model.layers.24.self_attn.v_proj: 3 +model.layers.25.self_attn.k_proj: 3 +model.layers.25.self_attn.v_proj: 2 +model.layers.26.self_attn.k_proj: 3 +model.layers.26.self_attn.v_proj: 3 +model.layers.27.self_attn.k_proj: 3 +model.layers.27.self_attn.v_proj: 3 +model.layers.28.self_attn.k_proj: 3 +model.layers.28.self_attn.v_proj: 2 +model.layers.29.self_attn.k_proj: 3 +model.layers.29.self_attn.v_proj: 4 +model.layers.30.self_attn.k_proj: 3 +model.layers.30.self_attn.v_proj: 4 +model.layers.31.self_attn.k_proj: 3 +model.layers.31.self_attn.v_proj: 3 +model.layers.0.self_attn.o_proj: 6 +model.layers.0.self_attn.q_proj: 3 +model.layers.1.self_attn.o_proj: 4 +model.layers.1.self_attn.q_proj: 4 +model.layers.2.self_attn.o_proj: 4 +model.layers.2.self_attn.q_proj: 3 +model.layers.3.self_attn.o_proj: 3 +model.layers.3.self_attn.q_proj: 4 +model.layers.4.self_attn.o_proj: 4 +model.layers.4.self_attn.q_proj: 3 +model.layers.5.self_attn.o_proj: 3 +model.layers.5.self_attn.q_proj: 4 +model.layers.6.self_attn.o_proj: 3 +model.layers.6.self_attn.q_proj: 4 +model.layers.7.self_attn.o_proj: 4 +model.layers.7.self_attn.q_proj: 4 +model.layers.8.self_attn.o_proj: 4 +model.layers.8.self_attn.q_proj: 3 +model.layers.9.self_attn.o_proj: 4 +model.layers.9.self_attn.q_proj: 3 +model.layers.10.self_attn.o_proj: 4 +model.layers.10.self_attn.q_proj: 3 +model.layers.11.self_attn.o_proj: 4 +model.layers.11.self_attn.q_proj: 4 +model.layers.12.self_attn.o_proj: 4 +model.layers.12.self_attn.q_proj: 4 +model.layers.13.self_attn.o_proj: 4 +model.layers.13.self_attn.q_proj: 4 +model.layers.14.self_attn.o_proj: 4 +model.layers.14.self_attn.q_proj: 4 +model.layers.15.self_attn.o_proj: 4 +model.layers.15.self_attn.q_proj: 3 +model.layers.16.self_attn.o_proj: 3 +model.layers.16.self_attn.q_proj: 3 +model.layers.17.self_attn.o_proj: 3 +model.layers.17.self_attn.q_proj: 3 +model.layers.18.self_attn.o_proj: 3 +model.layers.18.self_attn.q_proj: 3 +model.layers.19.self_attn.o_proj: 3 +model.layers.19.self_attn.q_proj: 3 +model.layers.20.self_attn.o_proj: 3 +model.layers.20.self_attn.q_proj: 3 +model.layers.21.self_attn.o_proj: 4 +model.layers.21.self_attn.q_proj: 3 +model.layers.22.self_attn.o_proj: 3 +model.layers.22.self_attn.q_proj: 3 +model.layers.23.self_attn.o_proj: 2 +model.layers.23.self_attn.q_proj: 3 +model.layers.24.self_attn.o_proj: 2 +model.layers.24.self_attn.q_proj: 3 +model.layers.25.self_attn.o_proj: 3 +model.layers.25.self_attn.q_proj: 3 +model.layers.26.self_attn.o_proj: 4 +model.layers.26.self_attn.q_proj: 2 +model.layers.27.self_attn.o_proj: 3 +model.layers.27.self_attn.q_proj: 3 +model.layers.28.self_attn.o_proj: 6 +model.layers.28.self_attn.q_proj: 2 +model.layers.29.self_attn.o_proj: 3 +model.layers.29.self_attn.q_proj: 4 +model.layers.30.self_attn.o_proj: 3 +model.layers.30.self_attn.q_proj: 4 +model.layers.31.self_attn.o_proj: 3 +model.layers.31.self_attn.q_proj: 3 \ No newline at end of file diff --git a/evo-kl-configuration-3.5-v2.txt b/evo-kl-configuration-3.5-v2.txt new file mode 100644 index 0000000000000000000000000000000000000000..a7ed365fe97564d79285840c22dc09a485d13316 --- /dev/null +++ b/evo-kl-configuration-3.5-v2.txt @@ -0,0 +1,224 @@ +model.layers.0.mlp.down_proj: 4 +model.layers.0.mlp.gate_proj: 3 +model.layers.0.mlp.up_proj: 3 +model.layers.1.mlp.down_proj: 4 +model.layers.1.mlp.gate_proj: 4 +model.layers.1.mlp.up_proj: 3 +model.layers.2.mlp.down_proj: 4 +model.layers.2.mlp.gate_proj: 3 +model.layers.2.mlp.up_proj: 3 +model.layers.3.mlp.down_proj: 4 +model.layers.3.mlp.gate_proj: 3 +model.layers.3.mlp.up_proj: 4 +model.layers.4.mlp.down_proj: 4 +model.layers.4.mlp.gate_proj: 4 +model.layers.4.mlp.up_proj: 4 +model.layers.5.mlp.down_proj: 4 +model.layers.5.mlp.gate_proj: 3 +model.layers.5.mlp.up_proj: 4 +model.layers.6.mlp.down_proj: 4 +model.layers.6.mlp.gate_proj: 3 +model.layers.6.mlp.up_proj: 3 +model.layers.7.mlp.down_proj: 4 +model.layers.7.mlp.gate_proj: 3 +model.layers.7.mlp.up_proj: 3 +model.layers.8.mlp.down_proj: 4 +model.layers.8.mlp.gate_proj: 4 +model.layers.8.mlp.up_proj: 3 +model.layers.9.mlp.down_proj: 4 +model.layers.9.mlp.gate_proj: 3 +model.layers.9.mlp.up_proj: 4 +model.layers.10.mlp.down_proj: 4 +model.layers.10.mlp.gate_proj: 3 +model.layers.10.mlp.up_proj: 3 +model.layers.11.mlp.down_proj: 3 +model.layers.11.mlp.gate_proj: 3 +model.layers.11.mlp.up_proj: 4 +model.layers.12.mlp.down_proj: 4 +model.layers.12.mlp.gate_proj: 4 +model.layers.12.mlp.up_proj: 4 +model.layers.13.mlp.down_proj: 4 +model.layers.13.mlp.gate_proj: 3 +model.layers.13.mlp.up_proj: 4 +model.layers.14.mlp.down_proj: 3 +model.layers.14.mlp.gate_proj: 3 +model.layers.14.mlp.up_proj: 3 +model.layers.15.mlp.down_proj: 3 +model.layers.15.mlp.gate_proj: 3 +model.layers.15.mlp.up_proj: 4 +model.layers.16.mlp.down_proj: 3 +model.layers.16.mlp.gate_proj: 3 +model.layers.16.mlp.up_proj: 3 +model.layers.17.mlp.down_proj: 4 +model.layers.17.mlp.gate_proj: 3 +model.layers.17.mlp.up_proj: 3 +model.layers.18.mlp.down_proj: 4 +model.layers.18.mlp.gate_proj: 3 +model.layers.18.mlp.up_proj: 4 +model.layers.19.mlp.down_proj: 3 +model.layers.19.mlp.gate_proj: 3 +model.layers.19.mlp.up_proj: 4 +model.layers.20.mlp.down_proj: 4 +model.layers.20.mlp.gate_proj: 4 +model.layers.20.mlp.up_proj: 3 +model.layers.21.mlp.down_proj: 4 +model.layers.21.mlp.gate_proj: 3 +model.layers.21.mlp.up_proj: 3 +model.layers.22.mlp.down_proj: 4 +model.layers.22.mlp.gate_proj: 3 +model.layers.22.mlp.up_proj: 3 +model.layers.23.mlp.down_proj: 3 +model.layers.23.mlp.gate_proj: 3 +model.layers.23.mlp.up_proj: 4 +model.layers.24.mlp.down_proj: 3 +model.layers.24.mlp.gate_proj: 3 +model.layers.24.mlp.up_proj: 3 +model.layers.25.mlp.down_proj: 4 +model.layers.25.mlp.gate_proj: 3 +model.layers.25.mlp.up_proj: 3 +model.layers.26.mlp.down_proj: 3 +model.layers.26.mlp.gate_proj: 3 +model.layers.26.mlp.up_proj: 4 +model.layers.27.mlp.down_proj: 3 +model.layers.27.mlp.gate_proj: 4 +model.layers.27.mlp.up_proj: 4 +model.layers.28.mlp.down_proj: 4 +model.layers.28.mlp.gate_proj: 3 +model.layers.28.mlp.up_proj: 3 +model.layers.29.mlp.down_proj: 3 +model.layers.29.mlp.gate_proj: 3 +model.layers.29.mlp.up_proj: 3 +model.layers.30.mlp.down_proj: 4 +model.layers.30.mlp.gate_proj: 3 +model.layers.30.mlp.up_proj: 4 +model.layers.31.mlp.down_proj: 4 +model.layers.31.mlp.gate_proj: 4 +model.layers.31.mlp.up_proj: 4 +model.layers.0.self_attn.k_proj: 3 +model.layers.0.self_attn.v_proj: 8 +model.layers.1.self_attn.k_proj: 4 +model.layers.1.self_attn.v_proj: 6 +model.layers.2.self_attn.k_proj: 6 +model.layers.2.self_attn.v_proj: 6 +model.layers.3.self_attn.k_proj: 4 +model.layers.3.self_attn.v_proj: 4 +model.layers.4.self_attn.k_proj: 4 +model.layers.4.self_attn.v_proj: 4 +model.layers.5.self_attn.k_proj: 4 +model.layers.5.self_attn.v_proj: 3 +model.layers.6.self_attn.k_proj: 3 +model.layers.6.self_attn.v_proj: 4 +model.layers.7.self_attn.k_proj: 3 +model.layers.7.self_attn.v_proj: 3 +model.layers.8.self_attn.k_proj: 4 +model.layers.8.self_attn.v_proj: 4 +model.layers.9.self_attn.k_proj: 4 +model.layers.9.self_attn.v_proj: 3 +model.layers.10.self_attn.k_proj: 3 +model.layers.10.self_attn.v_proj: 4 +model.layers.11.self_attn.k_proj: 4 +model.layers.11.self_attn.v_proj: 4 +model.layers.12.self_attn.k_proj: 4 +model.layers.12.self_attn.v_proj: 4 +model.layers.13.self_attn.k_proj: 4 +model.layers.13.self_attn.v_proj: 3 +model.layers.14.self_attn.k_proj: 3 +model.layers.14.self_attn.v_proj: 3 +model.layers.15.self_attn.k_proj: 4 +model.layers.15.self_attn.v_proj: 6 +model.layers.16.self_attn.k_proj: 3 +model.layers.16.self_attn.v_proj: 4 +model.layers.17.self_attn.k_proj: 3 +model.layers.17.self_attn.v_proj: 3 +model.layers.18.self_attn.k_proj: 3 +model.layers.18.self_attn.v_proj: 4 +model.layers.19.self_attn.k_proj: 3 +model.layers.19.self_attn.v_proj: 4 +model.layers.20.self_attn.k_proj: 3 +model.layers.20.self_attn.v_proj: 4 +model.layers.21.self_attn.k_proj: 3 +model.layers.21.self_attn.v_proj: 4 +model.layers.22.self_attn.k_proj: 3 +model.layers.22.self_attn.v_proj: 3 +model.layers.23.self_attn.k_proj: 3 +model.layers.23.self_attn.v_proj: 3 +model.layers.24.self_attn.k_proj: 3 +model.layers.24.self_attn.v_proj: 3 +model.layers.25.self_attn.k_proj: 3 +model.layers.25.self_attn.v_proj: 3 +model.layers.26.self_attn.k_proj: 3 +model.layers.26.self_attn.v_proj: 4 +model.layers.27.self_attn.k_proj: 3 +model.layers.27.self_attn.v_proj: 4 +model.layers.28.self_attn.k_proj: 3 +model.layers.28.self_attn.v_proj: 4 +model.layers.29.self_attn.k_proj: 3 +model.layers.29.self_attn.v_proj: 4 +model.layers.30.self_attn.k_proj: 3 +model.layers.30.self_attn.v_proj: 3 +model.layers.31.self_attn.k_proj: 3 +model.layers.31.self_attn.v_proj: 3 +model.layers.0.self_attn.o_proj: 6 +model.layers.0.self_attn.q_proj: 3 +model.layers.1.self_attn.o_proj: 4 +model.layers.1.self_attn.q_proj: 3 +model.layers.2.self_attn.o_proj: 4 +model.layers.2.self_attn.q_proj: 4 +model.layers.3.self_attn.o_proj: 4 +model.layers.3.self_attn.q_proj: 4 +model.layers.4.self_attn.o_proj: 4 +model.layers.4.self_attn.q_proj: 4 +model.layers.5.self_attn.o_proj: 3 +model.layers.5.self_attn.q_proj: 4 +model.layers.6.self_attn.o_proj: 3 +model.layers.6.self_attn.q_proj: 4 +model.layers.7.self_attn.o_proj: 4 +model.layers.7.self_attn.q_proj: 4 +model.layers.8.self_attn.o_proj: 6 +model.layers.8.self_attn.q_proj: 3 +model.layers.9.self_attn.o_proj: 4 +model.layers.9.self_attn.q_proj: 4 +model.layers.10.self_attn.o_proj: 4 +model.layers.10.self_attn.q_proj: 4 +model.layers.11.self_attn.o_proj: 3 +model.layers.11.self_attn.q_proj: 4 +model.layers.12.self_attn.o_proj: 4 +model.layers.12.self_attn.q_proj: 4 +model.layers.13.self_attn.o_proj: 8 +model.layers.13.self_attn.q_proj: 4 +model.layers.14.self_attn.o_proj: 4 +model.layers.14.self_attn.q_proj: 4 +model.layers.15.self_attn.o_proj: 4 +model.layers.15.self_attn.q_proj: 3 +model.layers.16.self_attn.o_proj: 3 +model.layers.16.self_attn.q_proj: 4 +model.layers.17.self_attn.o_proj: 3 +model.layers.17.self_attn.q_proj: 3 +model.layers.18.self_attn.o_proj: 3 +model.layers.18.self_attn.q_proj: 3 +model.layers.19.self_attn.o_proj: 3 +model.layers.19.self_attn.q_proj: 3 +model.layers.20.self_attn.o_proj: 3 +model.layers.20.self_attn.q_proj: 3 +model.layers.21.self_attn.o_proj: 3 +model.layers.21.self_attn.q_proj: 3 +model.layers.22.self_attn.o_proj: 3 +model.layers.22.self_attn.q_proj: 3 +model.layers.23.self_attn.o_proj: 4 +model.layers.23.self_attn.q_proj: 3 +model.layers.24.self_attn.o_proj: 3 +model.layers.24.self_attn.q_proj: 3 +model.layers.25.self_attn.o_proj: 4 +model.layers.25.self_attn.q_proj: 3 +model.layers.26.self_attn.o_proj: 3 +model.layers.26.self_attn.q_proj: 4 +model.layers.27.self_attn.o_proj: 3 +model.layers.27.self_attn.q_proj: 3 +model.layers.28.self_attn.o_proj: 3 +model.layers.28.self_attn.q_proj: 3 +model.layers.29.self_attn.o_proj: 4 +model.layers.29.self_attn.q_proj: 4 +model.layers.30.self_attn.o_proj: 3 +model.layers.30.self_attn.q_proj: 4 +model.layers.31.self_attn.o_proj: 3 +model.layers.31.self_attn.q_proj: 3 \ No newline at end of file diff --git a/evo-kl-configuration-3.75-v2.txt b/evo-kl-configuration-3.75-v2.txt new file mode 100644 index 0000000000000000000000000000000000000000..871e9d5a1f5dc89869f12e500a6d570dc39c91e6 --- /dev/null +++ b/evo-kl-configuration-3.75-v2.txt @@ -0,0 +1,224 @@ +model.layers.0.mlp.down_proj: 4 +model.layers.0.mlp.gate_proj: 3 +model.layers.0.mlp.up_proj: 4 +model.layers.1.mlp.down_proj: 4 +model.layers.1.mlp.gate_proj: 4 +model.layers.1.mlp.up_proj: 4 +model.layers.2.mlp.down_proj: 4 +model.layers.2.mlp.gate_proj: 4 +model.layers.2.mlp.up_proj: 4 +model.layers.3.mlp.down_proj: 4 +model.layers.3.mlp.gate_proj: 3 +model.layers.3.mlp.up_proj: 4 +model.layers.4.mlp.down_proj: 4 +model.layers.4.mlp.gate_proj: 3 +model.layers.4.mlp.up_proj: 4 +model.layers.5.mlp.down_proj: 4 +model.layers.5.mlp.gate_proj: 3 +model.layers.5.mlp.up_proj: 4 +model.layers.6.mlp.down_proj: 4 +model.layers.6.mlp.gate_proj: 3 +model.layers.6.mlp.up_proj: 4 +model.layers.7.mlp.down_proj: 4 +model.layers.7.mlp.gate_proj: 3 +model.layers.7.mlp.up_proj: 4 +model.layers.8.mlp.down_proj: 4 +model.layers.8.mlp.gate_proj: 3 +model.layers.8.mlp.up_proj: 4 +model.layers.9.mlp.down_proj: 3 +model.layers.9.mlp.gate_proj: 3 +model.layers.9.mlp.up_proj: 4 +model.layers.10.mlp.down_proj: 3 +model.layers.10.mlp.gate_proj: 3 +model.layers.10.mlp.up_proj: 3 +model.layers.11.mlp.down_proj: 4 +model.layers.11.mlp.gate_proj: 4 +model.layers.11.mlp.up_proj: 3 +model.layers.12.mlp.down_proj: 4 +model.layers.12.mlp.gate_proj: 4 +model.layers.12.mlp.up_proj: 4 +model.layers.13.mlp.down_proj: 4 +model.layers.13.mlp.gate_proj: 4 +model.layers.13.mlp.up_proj: 4 +model.layers.14.mlp.down_proj: 4 +model.layers.14.mlp.gate_proj: 3 +model.layers.14.mlp.up_proj: 4 +model.layers.15.mlp.down_proj: 4 +model.layers.15.mlp.gate_proj: 3 +model.layers.15.mlp.up_proj: 3 +model.layers.16.mlp.down_proj: 4 +model.layers.16.mlp.gate_proj: 3 +model.layers.16.mlp.up_proj: 4 +model.layers.17.mlp.down_proj: 4 +model.layers.17.mlp.gate_proj: 4 +model.layers.17.mlp.up_proj: 4 +model.layers.18.mlp.down_proj: 4 +model.layers.18.mlp.gate_proj: 4 +model.layers.18.mlp.up_proj: 4 +model.layers.19.mlp.down_proj: 4 +model.layers.19.mlp.gate_proj: 4 +model.layers.19.mlp.up_proj: 4 +model.layers.20.mlp.down_proj: 4 +model.layers.20.mlp.gate_proj: 4 +model.layers.20.mlp.up_proj: 4 +model.layers.21.mlp.down_proj: 4 +model.layers.21.mlp.gate_proj: 3 +model.layers.21.mlp.up_proj: 4 +model.layers.22.mlp.down_proj: 4 +model.layers.22.mlp.gate_proj: 4 +model.layers.22.mlp.up_proj: 4 +model.layers.23.mlp.down_proj: 4 +model.layers.23.mlp.gate_proj: 4 +model.layers.23.mlp.up_proj: 4 +model.layers.24.mlp.down_proj: 3 +model.layers.24.mlp.gate_proj: 4 +model.layers.24.mlp.up_proj: 4 +model.layers.25.mlp.down_proj: 4 +model.layers.25.mlp.gate_proj: 3 +model.layers.25.mlp.up_proj: 3 +model.layers.26.mlp.down_proj: 3 +model.layers.26.mlp.gate_proj: 3 +model.layers.26.mlp.up_proj: 4 +model.layers.27.mlp.down_proj: 3 +model.layers.27.mlp.gate_proj: 4 +model.layers.27.mlp.up_proj: 4 +model.layers.28.mlp.down_proj: 4 +model.layers.28.mlp.gate_proj: 3 +model.layers.28.mlp.up_proj: 3 +model.layers.29.mlp.down_proj: 4 +model.layers.29.mlp.gate_proj: 4 +model.layers.29.mlp.up_proj: 3 +model.layers.30.mlp.down_proj: 4 +model.layers.30.mlp.gate_proj: 4 +model.layers.30.mlp.up_proj: 4 +model.layers.31.mlp.down_proj: 4 +model.layers.31.mlp.gate_proj: 4 +model.layers.31.mlp.up_proj: 4 +model.layers.0.self_attn.k_proj: 4 +model.layers.0.self_attn.v_proj: 6 +model.layers.1.self_attn.k_proj: 3 +model.layers.1.self_attn.v_proj: 8 +model.layers.2.self_attn.k_proj: 4 +model.layers.2.self_attn.v_proj: 4 +model.layers.3.self_attn.k_proj: 4 +model.layers.3.self_attn.v_proj: 6 +model.layers.4.self_attn.k_proj: 3 +model.layers.4.self_attn.v_proj: 4 +model.layers.5.self_attn.k_proj: 4 +model.layers.5.self_attn.v_proj: 3 +model.layers.6.self_attn.k_proj: 4 +model.layers.6.self_attn.v_proj: 4 +model.layers.7.self_attn.k_proj: 4 +model.layers.7.self_attn.v_proj: 4 +model.layers.8.self_attn.k_proj: 6 +model.layers.8.self_attn.v_proj: 3 +model.layers.9.self_attn.k_proj: 6 +model.layers.9.self_attn.v_proj: 4 +model.layers.10.self_attn.k_proj: 4 +model.layers.10.self_attn.v_proj: 3 +model.layers.11.self_attn.k_proj: 4 +model.layers.11.self_attn.v_proj: 4 +model.layers.12.self_attn.k_proj: 4 +model.layers.12.self_attn.v_proj: 4 +model.layers.13.self_attn.k_proj: 4 +model.layers.13.self_attn.v_proj: 3 +model.layers.14.self_attn.k_proj: 3 +model.layers.14.self_attn.v_proj: 6 +model.layers.15.self_attn.k_proj: 4 +model.layers.15.self_attn.v_proj: 6 +model.layers.16.self_attn.k_proj: 4 +model.layers.16.self_attn.v_proj: 6 +model.layers.17.self_attn.k_proj: 4 +model.layers.17.self_attn.v_proj: 3 +model.layers.18.self_attn.k_proj: 3 +model.layers.18.self_attn.v_proj: 4 +model.layers.19.self_attn.k_proj: 4 +model.layers.19.self_attn.v_proj: 3 +model.layers.20.self_attn.k_proj: 3 +model.layers.20.self_attn.v_proj: 6 +model.layers.21.self_attn.k_proj: 3 +model.layers.21.self_attn.v_proj: 4 +model.layers.22.self_attn.k_proj: 3 +model.layers.22.self_attn.v_proj: 3 +model.layers.23.self_attn.k_proj: 3 +model.layers.23.self_attn.v_proj: 3 +model.layers.24.self_attn.k_proj: 4 +model.layers.24.self_attn.v_proj: 3 +model.layers.25.self_attn.k_proj: 4 +model.layers.25.self_attn.v_proj: 3 +model.layers.26.self_attn.k_proj: 3 +model.layers.26.self_attn.v_proj: 3 +model.layers.27.self_attn.k_proj: 3 +model.layers.27.self_attn.v_proj: 4 +model.layers.28.self_attn.k_proj: 4 +model.layers.28.self_attn.v_proj: 4 +model.layers.29.self_attn.k_proj: 3 +model.layers.29.self_attn.v_proj: 4 +model.layers.30.self_attn.k_proj: 3 +model.layers.30.self_attn.v_proj: 3 +model.layers.31.self_attn.k_proj: 3 +model.layers.31.self_attn.v_proj: 4 +model.layers.0.self_attn.o_proj: 4 +model.layers.0.self_attn.q_proj: 3 +model.layers.1.self_attn.o_proj: 4 +model.layers.1.self_attn.q_proj: 4 +model.layers.2.self_attn.o_proj: 4 +model.layers.2.self_attn.q_proj: 4 +model.layers.3.self_attn.o_proj: 3 +model.layers.3.self_attn.q_proj: 4 +model.layers.4.self_attn.o_proj: 4 +model.layers.4.self_attn.q_proj: 4 +model.layers.5.self_attn.o_proj: 4 +model.layers.5.self_attn.q_proj: 4 +model.layers.6.self_attn.o_proj: 4 +model.layers.6.self_attn.q_proj: 3 +model.layers.7.self_attn.o_proj: 4 +model.layers.7.self_attn.q_proj: 4 +model.layers.8.self_attn.o_proj: 4 +model.layers.8.self_attn.q_proj: 4 +model.layers.9.self_attn.o_proj: 6 +model.layers.9.self_attn.q_proj: 4 +model.layers.10.self_attn.o_proj: 4 +model.layers.10.self_attn.q_proj: 4 +model.layers.11.self_attn.o_proj: 4 +model.layers.11.self_attn.q_proj: 4 +model.layers.12.self_attn.o_proj: 4 +model.layers.12.self_attn.q_proj: 4 +model.layers.13.self_attn.o_proj: 4 +model.layers.13.self_attn.q_proj: 4 +model.layers.14.self_attn.o_proj: 4 +model.layers.14.self_attn.q_proj: 6 +model.layers.15.self_attn.o_proj: 4 +model.layers.15.self_attn.q_proj: 6 +model.layers.16.self_attn.o_proj: 6 +model.layers.16.self_attn.q_proj: 4 +model.layers.17.self_attn.o_proj: 4 +model.layers.17.self_attn.q_proj: 3 +model.layers.18.self_attn.o_proj: 4 +model.layers.18.self_attn.q_proj: 4 +model.layers.19.self_attn.o_proj: 3 +model.layers.19.self_attn.q_proj: 4 +model.layers.20.self_attn.o_proj: 4 +model.layers.20.self_attn.q_proj: 3 +model.layers.21.self_attn.o_proj: 3 +model.layers.21.self_attn.q_proj: 4 +model.layers.22.self_attn.o_proj: 3 +model.layers.22.self_attn.q_proj: 4 +model.layers.23.self_attn.o_proj: 3 +model.layers.23.self_attn.q_proj: 3 +model.layers.24.self_attn.o_proj: 3 +model.layers.24.self_attn.q_proj: 3 +model.layers.25.self_attn.o_proj: 4 +model.layers.25.self_attn.q_proj: 3 +model.layers.26.self_attn.o_proj: 4 +model.layers.26.self_attn.q_proj: 3 +model.layers.27.self_attn.o_proj: 3 +model.layers.27.self_attn.q_proj: 3 +model.layers.28.self_attn.o_proj: 3 +model.layers.28.self_attn.q_proj: 4 +model.layers.29.self_attn.o_proj: 4 +model.layers.29.self_attn.q_proj: 4 +model.layers.30.self_attn.o_proj: 3 +model.layers.30.self_attn.q_proj: 3 +model.layers.31.self_attn.o_proj: 4 +model.layers.31.self_attn.q_proj: 4 \ No newline at end of file diff --git a/model.layers.0.mlp.down_proj/data.pt b/model.layers.0.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..37b2e72ed55d02b1b7d4768f735062b9dfb10ac9 --- /dev/null +++ b/model.layers.0.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad6aa9e4b39941e4e390b0957c5b4614e3e36f577d4b0be4eb05dfa121219159 +size 60556799 diff --git a/model.layers.0.mlp.gate_proj/data.pt b/model.layers.0.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..84fca07add7c0495f5c6d5661c819b70adb5b098 --- /dev/null +++ b/model.layers.0.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3a87ff8c119c3a45703c2ca10a1d23158fb6172acabc37b6afea6a75affbc9f +size 60556799 diff --git a/model.layers.0.mlp.up_proj/data.pt b/model.layers.0.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..112c114e45f50f9ae64327dc8bd0901b9d698dcb --- /dev/null +++ b/model.layers.0.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef91108126e433801c55ec845d801b1f510e0e5b3612c5c73da2f358d9debcea +size 60556799 diff --git a/model.layers.0.self_attn.k_proj/data.pt b/model.layers.0.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a01a20a49c60a63d94e762d1d4861e2f59b2f3a --- /dev/null +++ b/model.layers.0.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69219628c4e06ef22ee516f0744f3c845b5eb2ef6b19e0566488d9dcda6beffb +size 4326911 diff --git a/model.layers.0.self_attn.o_proj/data.pt b/model.layers.0.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e0f7fd24cc444c2bf46dfa4c2a5f59444d475a9 --- /dev/null +++ b/model.layers.0.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d25cd01037f67475ac9cfc02f79316cb734ad6315f3735cdab8dcb00df710f86 +size 17303039 diff --git a/model.layers.0.self_attn.q_proj/data.pt b/model.layers.0.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1a3f92e750a8866f5a14ee66035c7650e38b9f8 --- /dev/null +++ b/model.layers.0.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc37d678f205dc7572d5b45ea003564766621bc1d5e2d8991a2166bec541bbb7 +size 17303039 diff --git a/model.layers.0.self_attn.v_proj/data.pt b/model.layers.0.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdb7360d2580ed56d31897b96ea0f7bac2ac0f0e --- /dev/null +++ b/model.layers.0.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4136b4f26f55f90133ffe450df9061d8cc929451a81e2e5ba327ca9fd15610a2 +size 4326911 diff --git a/model.layers.1.mlp.down_proj/data.pt b/model.layers.1.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..97b2a8e471ddaaf62d958a11626b170c6fcd713a --- /dev/null +++ b/model.layers.1.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f8506138944972ce1ce86e2874ed5b48043db3e916c29200640fc58cc9f1f80 +size 60556799 diff --git a/model.layers.1.mlp.gate_proj/data.pt b/model.layers.1.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..c18ed5333500a69cc3b7cb68f8af844da4422fb0 --- /dev/null +++ b/model.layers.1.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28bc549fc51bde6275acc36d6a383334dfa48d6df621dfbf3a451729e2297550 +size 60556799 diff --git a/model.layers.1.mlp.up_proj/data.pt b/model.layers.1.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecd523aea8c79e365e157ffc4b78e7253a52321b --- /dev/null +++ b/model.layers.1.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:613cef1546c328228b2a3a7bdca0bb47ae61a1d8c37d865bc64f8a52ff82171e +size 60556799 diff --git a/model.layers.1.self_attn.k_proj/data.pt b/model.layers.1.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..96a39351c2b513305c7ce58995cec6cce0aac709 --- /dev/null +++ b/model.layers.1.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd28c601bed4c42b9ba24e8ee3ef6f5845595645cb0698f64497b022677109f2 +size 4326911 diff --git a/model.layers.1.self_attn.o_proj/data.pt b/model.layers.1.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..a41dbd7d06c4053bec6cfd2c2a9f85b128824e3f --- /dev/null +++ b/model.layers.1.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b3688c5140990d724b46fbc97ada1ade768f02c507d527fba0df105aa17c13c +size 17303039 diff --git a/model.layers.1.self_attn.q_proj/data.pt b/model.layers.1.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7e826bd46b089d53734ce4d0a9f90ddea540149 --- /dev/null +++ b/model.layers.1.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaad8244238fe5b18dff2a7ac969e8f1dbd5df412f929d51ffa60979326317b5 +size 17303039 diff --git a/model.layers.1.self_attn.v_proj/data.pt b/model.layers.1.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcd3398a928ed565da79f2976f51a0f9a09c06f2 --- /dev/null +++ b/model.layers.1.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7df87f6c9eb0ae98529beb7dc1373e468867e1687e9060edbcf0b7e8b79982f +size 4326911 diff --git a/model.layers.10.mlp.down_proj/data.pt b/model.layers.10.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..8304d4d1a72c35bf351bb8ba0239267508b36a79 --- /dev/null +++ b/model.layers.10.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:243c19abfa02999c1d2ad49aa7dce2522417b4d8e16ecef2e8f32060abf6278a +size 60556799 diff --git a/model.layers.10.mlp.gate_proj/data.pt b/model.layers.10.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0f563c56447a727bd5e830639fd1c8f795421c6 --- /dev/null +++ b/model.layers.10.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae86a1ac47c33ef20bbe828a112714843d5dec5be9f6b7f673fd693f13048578 +size 60556799 diff --git a/model.layers.10.mlp.up_proj/data.pt b/model.layers.10.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ed475fb98e4e55f8bbd5130783ba7e581632d63 --- /dev/null +++ b/model.layers.10.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e33cb27b2264cdf9422b7b7ab00b7ed0a6ae965e586bf7bda4249ba290c0f91f +size 60556799 diff --git a/model.layers.10.self_attn.k_proj/data.pt b/model.layers.10.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e38e72df59d31f7d7fa497e881b27ee3062f14c --- /dev/null +++ b/model.layers.10.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86677d3fa841674e0e79186783efb7e060c7b6f65412f56545dd4320879c569b +size 4326911 diff --git a/model.layers.10.self_attn.o_proj/data.pt b/model.layers.10.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..05348851b2e16109c2c9dc8077ce6e7f5adfeb3d --- /dev/null +++ b/model.layers.10.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:308dbe77986e4f695c80b2ce5410a772916af810532ae7d5270bbdf72812b6b3 +size 17303039 diff --git a/model.layers.10.self_attn.q_proj/data.pt b/model.layers.10.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4a9112ec5c6b1b1b8901442a7ec18a5bd5a1486 --- /dev/null +++ b/model.layers.10.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50b6baff34468e1bc0b26c01dfb276c7ed2feb3b104f1e9af8d009356f883bf6 +size 17303039 diff --git a/model.layers.10.self_attn.v_proj/data.pt b/model.layers.10.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf892d689718e92740a829c1db91eed7d1d20571 --- /dev/null +++ b/model.layers.10.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18e4f4c879f587f50e6fd2f209f994fb5bfb347bf1acd21e3dd111cd824ea0ff +size 4326911 diff --git a/model.layers.11.mlp.down_proj/data.pt b/model.layers.11.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..aff4213b897340a7477f8afc7518985802560372 --- /dev/null +++ b/model.layers.11.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be3ed2fc6a78c20913e7610df54a2c17c6fe163257529205530a62db6f5219e6 +size 60556799 diff --git a/model.layers.11.mlp.gate_proj/data.pt b/model.layers.11.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..22bdd734ee2d1a57ce059a4ed3b5dd9433185ade --- /dev/null +++ b/model.layers.11.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6da931c576c895e1a56e421c13a550306eebd531b93fb6a5e3be2342da7b531c +size 60556799 diff --git a/model.layers.11.mlp.up_proj/data.pt b/model.layers.11.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..222e33328aa3db2ca3ba9f346dd3bedb3cd904fc --- /dev/null +++ b/model.layers.11.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf34c29def6ea4d8164ab23fd6292ef3524e80bbb416fd66e56531343f93aede +size 60556799 diff --git a/model.layers.11.self_attn.k_proj/data.pt b/model.layers.11.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..68301a5cbce42af4250002dd0f9ae5e41504be00 --- /dev/null +++ b/model.layers.11.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e61e19a09eafc2326c9b9645bb1ad51495607278aa8e276ca98da256ccd1adc7 +size 4326911 diff --git a/model.layers.11.self_attn.o_proj/data.pt b/model.layers.11.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fab234461cc27beeffade4ff3d0b4a7ce974bff --- /dev/null +++ b/model.layers.11.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c38d8e5e656603a2dbb983a2686cdad46212723ba784b778b83b824df5a6e55 +size 17303039 diff --git a/model.layers.11.self_attn.q_proj/data.pt b/model.layers.11.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..81205a5ba846cbdfa90c9bddb054fdd6e7ed44ba --- /dev/null +++ b/model.layers.11.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec66fa51b9bd8df856565a07a648a93b37700ea0151f2b45a68194b4bdf857cd +size 17303039 diff --git a/model.layers.11.self_attn.v_proj/data.pt b/model.layers.11.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cefd9053742aae404bee39d2bd33ff75ff445a5 --- /dev/null +++ b/model.layers.11.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a458551e4f3e02f05a8f1af0659332235c68c065903be4288800a395b97447e0 +size 4326911 diff --git a/model.layers.12.mlp.down_proj/data.pt b/model.layers.12.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..39832010a0b5eaf2f341861c95b2f853401fd93a --- /dev/null +++ b/model.layers.12.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63c76878012a75b2861349157727dbdad88c8970663f37115b116c2d61430b82 +size 60556799 diff --git a/model.layers.12.mlp.gate_proj/data.pt b/model.layers.12.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f3cc0a477f25628136f643708f58a7b2b571138 --- /dev/null +++ b/model.layers.12.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09f3cb4e9357e8cb2507126857b7c63fd06b793181e9b44e56c167b22782a741 +size 60556799 diff --git a/model.layers.12.mlp.up_proj/data.pt b/model.layers.12.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..50b84e8141f595aabb46302d16e674d1f9238295 --- /dev/null +++ b/model.layers.12.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c3cacd78883f82e9676a6d62a574a39a65d8459354aa1b08cde24e636470224 +size 60556799 diff --git a/model.layers.12.self_attn.k_proj/data.pt b/model.layers.12.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7adab9e302ba1cc548f9c45dfa35d120e1108b0 --- /dev/null +++ b/model.layers.12.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce15c46f5e7a65d351a14ff288ec70c51c873c4ab050e4ccc81f2e44ed1651a4 +size 4326911 diff --git a/model.layers.12.self_attn.o_proj/data.pt b/model.layers.12.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..88a0540e42d83050890d0d17f85518d654266d59 --- /dev/null +++ b/model.layers.12.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9d1a16eb11665a8cfc46b448ff209cd8aa3e40191e52693b84e7d4bea9f6e0e +size 17303039 diff --git a/model.layers.12.self_attn.q_proj/data.pt b/model.layers.12.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3cc01cb3f1782182cd9fc83e347ae3c156a7a9a --- /dev/null +++ b/model.layers.12.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cef05f7c22632f5af5e120700891d4f3480b6cfd7321d27bb5e27d764936923 +size 17303039 diff --git a/model.layers.12.self_attn.v_proj/data.pt b/model.layers.12.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b4078500f7f713d5c31b6652c15c34840e470fc --- /dev/null +++ b/model.layers.12.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f5d93830d5d103f9089ebcd7fe12a937341944e018d13263acd971404f16fb4 +size 4326911 diff --git a/model.layers.13.mlp.down_proj/data.pt b/model.layers.13.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e0c5ac7cc642087717752240ff9c96a1b973dfd --- /dev/null +++ b/model.layers.13.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21285378eb6996927308669a95117cd7d695dd8fcd5ae5169eb1696ae180682f +size 60556799 diff --git a/model.layers.13.mlp.gate_proj/data.pt b/model.layers.13.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..e55db0ea8eec2e0e7537d1429ad2961a6b058eb7 --- /dev/null +++ b/model.layers.13.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6f44023613bc05892cd189615b29371a0ff987f5b1da45ff8b7f175b5ca98d7 +size 60556799 diff --git a/model.layers.13.mlp.up_proj/data.pt b/model.layers.13.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..5262ac2393e6de06085db58d6a97e235680b6f88 --- /dev/null +++ b/model.layers.13.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c18145b24457bc01e766b3c32edae9d3dd73733891a9888212682d8c3a2007d +size 60556799 diff --git a/model.layers.13.self_attn.k_proj/data.pt b/model.layers.13.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..0756de9a7f2622b8103118f466c98cbceb4983e0 --- /dev/null +++ b/model.layers.13.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:588f53f9d02bd00c739e70d42c93d8a483e83e713af60e3ac51a386537a690c4 +size 4326911 diff --git a/model.layers.13.self_attn.o_proj/data.pt b/model.layers.13.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..33f356f047897e29d2130be7f6294f30171fa3c5 --- /dev/null +++ b/model.layers.13.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adfdeba39e52806bf0ce4f42e0216ca19ad306b5b89e267dfb5d0618712fab79 +size 17303039 diff --git a/model.layers.13.self_attn.q_proj/data.pt b/model.layers.13.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4fe4367239317e39821b19da5a0b8424f5f6447 --- /dev/null +++ b/model.layers.13.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab47c49f09963f5e43777386186791d3f4b269b6f709329ec4fe1b16bd28bd7d +size 17303039 diff --git a/model.layers.13.self_attn.v_proj/data.pt b/model.layers.13.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..3de52a29e442a6868552695806ffba0a6fd4d677 --- /dev/null +++ b/model.layers.13.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d548dcbde5cda08a6ae29c4d42c5fdbcba27090821ad99462982391cf557f6ef +size 4326911 diff --git a/model.layers.14.mlp.down_proj/data.pt b/model.layers.14.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..76b7536835d5760c248c2814a4b65805e2d59666 --- /dev/null +++ b/model.layers.14.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f64d63e1e5a09f17838fe81206e115a01417c75758587314cdd5e7f67b27085 +size 60556799 diff --git a/model.layers.14.mlp.gate_proj/data.pt b/model.layers.14.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f78e184eacf8482db332c838102e1d808b84f9b --- /dev/null +++ b/model.layers.14.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff0ff883c0324cb5157be7aec14cfbc0810b6752fc966222cbf2de97d0f73e52 +size 60556799 diff --git a/model.layers.14.mlp.up_proj/data.pt b/model.layers.14.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f59ec6245fb17a4e55be00be72beae4ff5cb4a3 --- /dev/null +++ b/model.layers.14.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83692b782426973305cb4b5da528d8ef90d779fa99fc3bbef53cc9b57b348e3f +size 60556799 diff --git a/model.layers.14.self_attn.k_proj/data.pt b/model.layers.14.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0b6dd3642ff2d60f4a7d03aa340bbfd5afa1843 --- /dev/null +++ b/model.layers.14.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:268c94b7f0ef408b325f2353079a08cf00ce9e460188f503bc4ea601de39452d +size 4326911 diff --git a/model.layers.14.self_attn.o_proj/data.pt b/model.layers.14.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..332b4dfe697ebe2dc6736239f234fdfc21c82655 --- /dev/null +++ b/model.layers.14.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c30318b90362c225c276e829e84ac6084e9f1b30829a2bbdcc56f80409c724e0 +size 17303039 diff --git a/model.layers.14.self_attn.q_proj/data.pt b/model.layers.14.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c7b6053b198724107359944fad7fb0739492496 --- /dev/null +++ b/model.layers.14.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92192bc558573d8fa2932c8dcffe6357124b634d36de6f1c5e23763cf72b8e0b +size 17303039 diff --git a/model.layers.14.self_attn.v_proj/data.pt b/model.layers.14.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cecb9712c17ae92dc8f14dbac08365fd6a38b30 --- /dev/null +++ b/model.layers.14.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64152d48091cec9d1a205b0406d470c09e4aa44a0fc722932527fca6a3e3b06a +size 4326911 diff --git a/model.layers.15.mlp.down_proj/data.pt b/model.layers.15.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e9b00f78f0930801e8c135f3b2355725b8d090c --- /dev/null +++ b/model.layers.15.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e012c71f596ed7d169b6e6b6005b2b614667222d1ad17f9e7aaf0952bf658e8 +size 60556799 diff --git a/model.layers.15.mlp.gate_proj/data.pt b/model.layers.15.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f78fec0a4b75673df0fa2b15ff9127c9ea6c707 --- /dev/null +++ b/model.layers.15.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25080b898e97a5b7829aff000a179afb4faec29ad053e5cd2b0a0d1552dc1165 +size 60556799 diff --git a/model.layers.15.mlp.up_proj/data.pt b/model.layers.15.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..16f8b98ae40b628e783cedc60480274f59f7cca2 --- /dev/null +++ b/model.layers.15.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b229d27eebe26f3423a1e59528fcfd38e3b6ad3c670db1fd2027442007aab894 +size 60556799 diff --git a/model.layers.15.self_attn.k_proj/data.pt b/model.layers.15.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..e77bdf02b24ea0d81f2e7500990ed7d8ef209ede --- /dev/null +++ b/model.layers.15.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06e9ecaad4bc22dc34e2b03430aa4e87e1162c27b102ac948c9ba8ca3f584888 +size 4326911 diff --git a/model.layers.15.self_attn.o_proj/data.pt b/model.layers.15.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..8952cec7b2596ec3c932e2be398bc5f2d0afa558 --- /dev/null +++ b/model.layers.15.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9c386fba8e9877ae8824dd7a0ed4d7b29230902909ef1308c5fcfab8309abd4 +size 17303039 diff --git a/model.layers.15.self_attn.q_proj/data.pt b/model.layers.15.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..49ae57ac6d2eca33950e8391966ed1a1f52a452e --- /dev/null +++ b/model.layers.15.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d29c9c67a40e5a7a25ab09e15b1dfc67036ddbfb9f7220ebb5e52b34c44f2f5 +size 17303039 diff --git a/model.layers.15.self_attn.v_proj/data.pt b/model.layers.15.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..c242704c197ec32d2070f35ba641279d7a6ee1d1 --- /dev/null +++ b/model.layers.15.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1df72001cbd124229645485882a9d6a8c73b48ff3de637e37e568315cf74be88 +size 4326911 diff --git a/model.layers.16.mlp.down_proj/data.pt b/model.layers.16.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..762ab20e7959bc059829142c9a14698bc0eabd03 --- /dev/null +++ b/model.layers.16.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:137533d4bdeff0b92e57e095edc512b83cce7c5cbe5a22440f04bcc4ca806f69 +size 60556799 diff --git a/model.layers.16.mlp.gate_proj/data.pt b/model.layers.16.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..04e8293a4a5836e9b92826f36ad0b0b4084b6f10 --- /dev/null +++ b/model.layers.16.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50735e3dd288f7a79e8ccac1cf7cc03193860bdf59e6d42d8cd7f801f5b27e0b +size 60556799 diff --git a/model.layers.16.mlp.up_proj/data.pt b/model.layers.16.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..d33acff0f7b5d662b6e440c389055c272ef5914d --- /dev/null +++ b/model.layers.16.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52f6074c1f3c917aa41b43532a482de7f4d4b67df70494594b6d091e5a68409b +size 60556799 diff --git a/model.layers.16.self_attn.k_proj/data.pt b/model.layers.16.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b75bd3353234465f5b2f065037ac3d4638d0bf4 --- /dev/null +++ b/model.layers.16.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d74dcaa0c5b025c6ab3a385ce1b6745364cc89cd27b0e7453ed4a104c307ce9 +size 4326911 diff --git a/model.layers.16.self_attn.o_proj/data.pt b/model.layers.16.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dcfd7e6c228d6d6d6c1f2b5c652b9aadd1e2042 --- /dev/null +++ b/model.layers.16.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14e2282f7e448a1aaa51f08b51e730b5ebc9167ee508ed700a2ad206c0b3effc +size 17303039 diff --git a/model.layers.16.self_attn.q_proj/data.pt b/model.layers.16.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2985e4a5fa5afbe3ddf37aea261d1b501caaaed --- /dev/null +++ b/model.layers.16.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8adae7ce21e08e11739e861dad17a25047b8d9438a5ea1fcb130e722505aa6e +size 17303039 diff --git a/model.layers.16.self_attn.v_proj/data.pt b/model.layers.16.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..571e37ae95e94a404b67a42eb6f5a244611df062 --- /dev/null +++ b/model.layers.16.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d413250b7c228c850c1a47e477198daa9596b645a570a58f00a52e55232a2254 +size 4326911 diff --git a/model.layers.17.mlp.down_proj/data.pt b/model.layers.17.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ea9045c4e9d186667f9acc10530e1e686354757 --- /dev/null +++ b/model.layers.17.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:954aa6cbfe0bd2dec4dd38e4962d9e2242fb5b1508d261e9e778c546d7eae01d +size 60556799 diff --git a/model.layers.17.mlp.gate_proj/data.pt b/model.layers.17.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc357bf2b5e0f1d525755987eb80e9839354271d --- /dev/null +++ b/model.layers.17.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c004923aba55d34939b8426f5cf2ab8b63e2e4185ecc8c037bec8584c392074 +size 60556799 diff --git a/model.layers.17.mlp.up_proj/data.pt b/model.layers.17.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a6594d82935e8e3d233cc0c32486243e0fbf118 --- /dev/null +++ b/model.layers.17.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3028d7c80b3cfcf3a981b130b6b32c1ed113181140674a0d9d5f87735b5171eb +size 60556799 diff --git a/model.layers.17.self_attn.k_proj/data.pt b/model.layers.17.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a642aeb0de38c4c0443ae29f69d82adbab9aff4 --- /dev/null +++ b/model.layers.17.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf670159b9c8784bac39bebdd057469e0d5c7ff8e6b1880631e10bd24194f331 +size 4326911 diff --git a/model.layers.17.self_attn.o_proj/data.pt b/model.layers.17.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..2258553dd5aae754e8e0f05df74b62045c758fcc --- /dev/null +++ b/model.layers.17.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42abe35ec12203b6c47d70d9d88cc1d5daa0eae8586d9bd948f90aa4724decff +size 17303039 diff --git a/model.layers.17.self_attn.q_proj/data.pt b/model.layers.17.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ba00831a06a106d496043ad28c8ff6877a83167 --- /dev/null +++ b/model.layers.17.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96ad1c77c791d32e1027d45df1616003139230832708828e3908356443f45431 +size 17303039 diff --git a/model.layers.17.self_attn.v_proj/data.pt b/model.layers.17.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..203c90799290354e76d8da9a704452d41dc7129f --- /dev/null +++ b/model.layers.17.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11d0e2110efd747e8d043cca8e53ba9298b62af257ec46c5ac7f78a794cb26d6 +size 4326911 diff --git a/model.layers.18.mlp.down_proj/data.pt b/model.layers.18.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b4ffebd404a1c851adfcd569aa8669a6b4cc4bb --- /dev/null +++ b/model.layers.18.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc27f6d1f6ebc31f107328e9093d1d4d5dfd4b51e95959c808adb5ff60b07a01 +size 60556799 diff --git a/model.layers.18.mlp.gate_proj/data.pt b/model.layers.18.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eca7e69dc5d712163e3f765a33cc2f33632f04a --- /dev/null +++ b/model.layers.18.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05933ce929d6608d27f5af9ea7a8287aefaa7ac0aa9ca1858014f46adc5e7d9d +size 60556799 diff --git a/model.layers.18.mlp.up_proj/data.pt b/model.layers.18.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc47761dec91d3f8848c3235c7d56f77539fee34 --- /dev/null +++ b/model.layers.18.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f3c5c0b892f2c42808a16f5b443ab54d5fc70d8309f9004934cbc8414613ba8 +size 60556799 diff --git a/model.layers.18.self_attn.k_proj/data.pt b/model.layers.18.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..a606fd79192d81e141e0656b71c0dfc9dec03f5a --- /dev/null +++ b/model.layers.18.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c270a9865c567adb071d4ac66055bd0baba4729d2f5f5dd107a79497b18cc87 +size 4326911 diff --git a/model.layers.18.self_attn.o_proj/data.pt b/model.layers.18.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..25cfc73427093c88a5fd77a20cba83a088f55670 --- /dev/null +++ b/model.layers.18.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ae2524a30bf79fc245cbd7c799311fec35defee6ab31f0f96d33cb031373fa9 +size 17303039 diff --git a/model.layers.18.self_attn.q_proj/data.pt b/model.layers.18.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2bfa78b843e2f9f71c35d6d2b98ec4b525306d7 --- /dev/null +++ b/model.layers.18.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1d64c7dcbfbc26601c7bf85a287d969c5df5f93ff3ae3c0c9b512d599689e3e +size 17303039 diff --git a/model.layers.18.self_attn.v_proj/data.pt b/model.layers.18.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd8ecefd372739b4cecb0a2d40d43d380555455d --- /dev/null +++ b/model.layers.18.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ba05ce445ce5251f81c8f1b6abd1432dcde51248d76126466eba252890ce73a +size 4326911 diff --git a/model.layers.19.mlp.down_proj/data.pt b/model.layers.19.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..3821e099b4b73dc92685b1316101c8b46a200edb --- /dev/null +++ b/model.layers.19.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc677d1529b2cc0313d87816461ad84f22febf0cce6cc085eba83685498a674f +size 60556799 diff --git a/model.layers.19.mlp.gate_proj/data.pt b/model.layers.19.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab5dddd0ee4ba5b96813514d18302293f8b3deab --- /dev/null +++ b/model.layers.19.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81e6758f296ed10d079d79b3b92dc53c4727a3621c6e17e472e548d65581c34d +size 60556799 diff --git a/model.layers.19.mlp.up_proj/data.pt b/model.layers.19.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3f29ffc87dced37c452b97e5223c4cfd49ae87a --- /dev/null +++ b/model.layers.19.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ce366852ed336eeee632c7e1350527810911bb9e3f70336224a3748e68ad43d +size 60556799 diff --git a/model.layers.19.self_attn.k_proj/data.pt b/model.layers.19.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a6152a67696b9c061af233323262ff6fc958109 --- /dev/null +++ b/model.layers.19.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a05a566c0be32ac1e7bc1627d9f3d80bceffd6b43b0a82256caf536ff5364494 +size 4326911 diff --git a/model.layers.19.self_attn.o_proj/data.pt b/model.layers.19.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..39f48492f9bdf00a919c494ee2459b58a66a2945 --- /dev/null +++ b/model.layers.19.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0ac644ae5b4813b6514284fa49a354daeaa5ebda0a8467429309dd5e2b6e5de +size 17303039 diff --git a/model.layers.19.self_attn.q_proj/data.pt b/model.layers.19.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1c2ae17e7d9c91ff21c095799d02cb1dbe2ab79 --- /dev/null +++ b/model.layers.19.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8abf6625602f0cc476324bd1fbd95ab8d8c983553872d44562cfcc5aa60e3fc +size 17303039 diff --git a/model.layers.19.self_attn.v_proj/data.pt b/model.layers.19.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5b77644adc3e120996a7a7cb72026f40a1d0333 --- /dev/null +++ b/model.layers.19.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fed95bef239a47963992ca373346d04a122e0d80fcf195f83c9b595d17b250c +size 4326911 diff --git a/model.layers.2.mlp.down_proj/data.pt b/model.layers.2.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..59afc17ab3b30cb402592115312a049a276adc4d --- /dev/null +++ b/model.layers.2.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7776778663d988bfced1e9f302a2a773584178dacfb6453f65c953d73e091e7 +size 60556799 diff --git a/model.layers.2.mlp.gate_proj/data.pt b/model.layers.2.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8d7c31f25b5135805881a495de8ea8bb1521611 --- /dev/null +++ b/model.layers.2.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39973e93113c126bf18a962989ea573c1f170080812dd09ea0b1584b39505919 +size 60556799 diff --git a/model.layers.2.mlp.up_proj/data.pt b/model.layers.2.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..6866507c838cb503afb6b2bba6292f251ce237fa --- /dev/null +++ b/model.layers.2.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d5fcec15ab613cbae332f9907cfeda34383034181841cc1d905e8be99a0cf1f +size 60556799 diff --git a/model.layers.2.self_attn.k_proj/data.pt b/model.layers.2.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5776453faef571d671694727faea24939801469 --- /dev/null +++ b/model.layers.2.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c7e8314d38bef450d5808968c0f01bd3f011d85b23fdae1f3df587a0d8bf905 +size 4326911 diff --git a/model.layers.2.self_attn.o_proj/data.pt b/model.layers.2.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..da4cec0e78496260cc0ede2337f0af0661ece86e --- /dev/null +++ b/model.layers.2.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e277203d6316bd78cbd091c7c31308a437c3e178432f2bf6e6560f28382b84d9 +size 17303039 diff --git a/model.layers.2.self_attn.q_proj/data.pt b/model.layers.2.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..9217b3807237d3ff7329198f5329c910f1a261b3 --- /dev/null +++ b/model.layers.2.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:833d8ceb580a61844d5b944be0d00bc21c65505255013e63688ceea1f5c0c31d +size 17303039 diff --git a/model.layers.2.self_attn.v_proj/data.pt b/model.layers.2.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b6ecfb5c1d674905a18f58637abe6c698a2a237 --- /dev/null +++ b/model.layers.2.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e39b910734cbababb5e34ab135990b2a85251fd60795f65882c2f405b601722 +size 4326911 diff --git a/model.layers.20.mlp.down_proj/data.pt b/model.layers.20.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6a93e962845ae340494d549ae1286766511cc36 --- /dev/null +++ b/model.layers.20.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaa75a5e19cd87089ce3eb105e53ef4d97cd8e391a7e4b48911249fcbffc302b +size 60556799 diff --git a/model.layers.20.mlp.gate_proj/data.pt b/model.layers.20.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8faf0769d282958f9ed7e9459c44dec5f986f4a --- /dev/null +++ b/model.layers.20.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebc41fa1f8c964cc6af131daaf843c2b579ea365befc6a00e096a2a75d946a2f +size 60556799 diff --git a/model.layers.20.mlp.up_proj/data.pt b/model.layers.20.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f2d43a46fc1ce066b78f029de48286a03b9bbfb --- /dev/null +++ b/model.layers.20.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:477d24e771768e7d8fadf767144e888ee86a9ecf71db84db0680755ca38154f2 +size 60556799 diff --git a/model.layers.20.self_attn.k_proj/data.pt b/model.layers.20.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..907c6828a686e78371f8a9aa67f794da0f10e2a2 --- /dev/null +++ b/model.layers.20.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08395c8765bf1c5dc26750d2a6d90d58366b3b5cf2c3c98b5dd0ff62e83b6fdc +size 4326911 diff --git a/model.layers.20.self_attn.o_proj/data.pt b/model.layers.20.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe8d09265ae07ee755b1b50c4b69a547c583ee87 --- /dev/null +++ b/model.layers.20.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b92d7ef2cf20dab18abf288f49fc60e8a451a19b72bba190ab9f5db2a6374c9 +size 17303039 diff --git a/model.layers.20.self_attn.q_proj/data.pt b/model.layers.20.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cd3ecc3f548919d87fbfa7102d43d6d6f96957d --- /dev/null +++ b/model.layers.20.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55d5101bcf021e1d2b894cac462291723b0c12cff4342a6e2c98c7e195a5fe73 +size 17303039 diff --git a/model.layers.20.self_attn.v_proj/data.pt b/model.layers.20.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed8d17ce032419cce285b68d383bb35e0de95be5 --- /dev/null +++ b/model.layers.20.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5241d65d12c01c1b330f35246e6c8bdc0a0cbaf32ea3f23824b468d1f5e9053f +size 4326911 diff --git a/model.layers.21.mlp.down_proj/data.pt b/model.layers.21.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..281622814ed3331e3b027c8c1bfc0c2a8d25adf1 --- /dev/null +++ b/model.layers.21.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5ad7bc2106202ce2f3b4ed17bc5c8fc444fedd33234e985beca5c02648b59ea +size 60556799 diff --git a/model.layers.21.mlp.gate_proj/data.pt b/model.layers.21.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f0cd7922dfb39f5c873e3f0ddcb9995e0959b26 --- /dev/null +++ b/model.layers.21.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d50abe7020725fbcc4f2d8729307dd48b74b8553d70223e48ce8387e6e7a12a +size 60556799 diff --git a/model.layers.21.mlp.up_proj/data.pt b/model.layers.21.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..f507fcf96424e0013df5223a7dc744b635747cf1 --- /dev/null +++ b/model.layers.21.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74b4c40d6124a111dbe6c818d09fbaa7b6a4561481ea3c87c2246fc3db921367 +size 60556799 diff --git a/model.layers.21.self_attn.k_proj/data.pt b/model.layers.21.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..e55223c8fd01acf3ac3123657c80a4f0c2e807a7 --- /dev/null +++ b/model.layers.21.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2283596c105367b19c2ba1ded6cbafffcacee64046b410ad1b5b2fb0d6c9bc5 +size 4326911 diff --git a/model.layers.21.self_attn.o_proj/data.pt b/model.layers.21.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..d98bf04fdf3d6e80f05797a8c3d51a9c72cbafd4 --- /dev/null +++ b/model.layers.21.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08310c57d75b0c5da2d6bb68499130f83814ae7877723062c29b9d17810e9f3f +size 17303039 diff --git a/model.layers.21.self_attn.q_proj/data.pt b/model.layers.21.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca3a45095794b0e32fd9763682e102fc8bc5ac16 --- /dev/null +++ b/model.layers.21.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da20e72568cb52ca118324694ed3a92def2ddcb4cfcf82597890637568898dd4 +size 17303039 diff --git a/model.layers.21.self_attn.v_proj/data.pt b/model.layers.21.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9fbacdb985b01f5f4a0829f2b4f636e5c313211 --- /dev/null +++ b/model.layers.21.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55aa4b83f4d405701ff481ac88c5572279b8dc6a2734f76b26a968c0a54f40fa +size 4326911 diff --git a/model.layers.22.mlp.down_proj/data.pt b/model.layers.22.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..c393b747b6e733af36a0635b643fafc581054451 --- /dev/null +++ b/model.layers.22.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d133d04f5d994bdc708463635d1a673182bf162eea1871e09e8296ed2abf3eab +size 60556799 diff --git a/model.layers.22.mlp.gate_proj/data.pt b/model.layers.22.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef2325f61979a4bf7d1c466bda5425fe58acee80 --- /dev/null +++ b/model.layers.22.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f176a00e25416341a528b8f2815b81b6661012c3054e5241a6a98fd88a98354f +size 60556799 diff --git a/model.layers.22.mlp.up_proj/data.pt b/model.layers.22.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..36c5526c1679bcfaf6a37c9d432ed1046a001f15 --- /dev/null +++ b/model.layers.22.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be504ad58db03681c8893587ec1c0d862db90b47deff27476b5382344540fa8c +size 60556799 diff --git a/model.layers.22.self_attn.k_proj/data.pt b/model.layers.22.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..80db40db36fadd56f5aeb349b7da31cef29b2bae --- /dev/null +++ b/model.layers.22.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f321f4b36d41cb1272af2d7adcc7c6ff1c61e6f20582db9f828e36de067a7433 +size 4326911 diff --git a/model.layers.22.self_attn.o_proj/data.pt b/model.layers.22.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8798674e327a639c39a8391a19e592b7610c633 --- /dev/null +++ b/model.layers.22.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee01076330bae70818f752b8b112d41f983c1890cae0fd3965e6fcc9508b7521 +size 17303039 diff --git a/model.layers.22.self_attn.q_proj/data.pt b/model.layers.22.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..d71bac3758403ab14e4d8ed9eee07334ae57d6cc --- /dev/null +++ b/model.layers.22.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c5a28d98796a6e5edad1dd67bc5a99f1f99a303dd645c387fca5950638af2f9 +size 17303039 diff --git a/model.layers.22.self_attn.v_proj/data.pt b/model.layers.22.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8a2bae3ad8ba2b73b0f19cee7fecc71b1c37805 --- /dev/null +++ b/model.layers.22.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99d647c941cd9513ba8722a7e3b88c88e3bd9bcc99af0c43a83ed6224df92db3 +size 4326911 diff --git a/model.layers.23.mlp.down_proj/data.pt b/model.layers.23.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..cafdba9a1e3e3609abed9f11b748f63db31b6f8d --- /dev/null +++ b/model.layers.23.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7af76426ca53a720fab6c12708299434e99e53d9734a13dce6d683acc4f50012 +size 60556799 diff --git a/model.layers.23.mlp.gate_proj/data.pt b/model.layers.23.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b56934408ef2077b262e06ea5d336dd2790473a --- /dev/null +++ b/model.layers.23.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97c78d5476fbcb3277c2891c04212d1c1946315ef9f3aa6c6a9c3338e3cd89e9 +size 60556799 diff --git a/model.layers.23.mlp.up_proj/data.pt b/model.layers.23.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..7492da5938215161d22e6aceca0992420eb9688e --- /dev/null +++ b/model.layers.23.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4842d1db4a56ee93e4a3c20be66b71e11c0d19ec5faf71d1afa451da844fba6d +size 60556799 diff --git a/model.layers.23.self_attn.k_proj/data.pt b/model.layers.23.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..f25f770b05f60b80634e1319484ea3096d00b795 --- /dev/null +++ b/model.layers.23.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8f7247937806a47b1903e8fe62dcf779bb4541fecea54b2150fe59215fb37f8 +size 4326911 diff --git a/model.layers.23.self_attn.o_proj/data.pt b/model.layers.23.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..373c396dd648a4e47edb1e8c918da0e8794ece90 --- /dev/null +++ b/model.layers.23.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3e476efeb8a66a8d874ce0e34afeb5ee3c6e32ee19c2c74ad30eeaf0055e596 +size 17303039 diff --git a/model.layers.23.self_attn.q_proj/data.pt b/model.layers.23.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..85d7d901bec3b03ff3cc71c9243b2461a989899a --- /dev/null +++ b/model.layers.23.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d9cc4e7231fbc584de5af6d710d3025536f20a740ad19b660bf4e9258df95f7 +size 17303039 diff --git a/model.layers.23.self_attn.v_proj/data.pt b/model.layers.23.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7c8cbe091d8cf7cc09fda27aa310180fe00e72a --- /dev/null +++ b/model.layers.23.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93f965891ae0d3c1e31cae7e6a1b6df995966ef4065a72eb02e62b606a3aa66a +size 4326911 diff --git a/model.layers.24.mlp.down_proj/data.pt b/model.layers.24.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..e522baf60d473033aa892c59dd1227b88288ee30 --- /dev/null +++ b/model.layers.24.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a2ccd2b4ce64546037fc3cdbcf1d672dba24fe16750f639de7ffc35debb15d0 +size 60556799 diff --git a/model.layers.24.mlp.gate_proj/data.pt b/model.layers.24.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..670d1de2c382773be2fcbd89fec26306783e35ea --- /dev/null +++ b/model.layers.24.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff2c1658261c50704ed31eacc6c9714389a0cd9cd3c54046806ae1a64444bc58 +size 60556799 diff --git a/model.layers.24.mlp.up_proj/data.pt b/model.layers.24.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e695899f32e442b54039c6e0bee5626fc40919b --- /dev/null +++ b/model.layers.24.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd899c817be254d0601a0b7de1aeacad7d6fdad694fa2472e210d433cd892a04 +size 60556799 diff --git a/model.layers.24.self_attn.k_proj/data.pt b/model.layers.24.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..c70945c60d5343a7c6bdbe1cbc5e9227bf63bd15 --- /dev/null +++ b/model.layers.24.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8272ad7769c1321d59fcc974c005b14bf4a0fb4d1db64fb578aad6375a0b9c79 +size 4326911 diff --git a/model.layers.24.self_attn.o_proj/data.pt b/model.layers.24.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..04379ab84ff6a75a1feb56e7e6f399b5a9a4e591 --- /dev/null +++ b/model.layers.24.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa944be245c7e97b9b86e58ffeb87dc6f431469c9b293ed9ba5eab780125fe3f +size 17303039 diff --git a/model.layers.24.self_attn.q_proj/data.pt b/model.layers.24.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..61044e1b4b7d6bb8b059a65eef8e4f049efd05ef --- /dev/null +++ b/model.layers.24.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1a704bfe729c22c8bdd08979ecd0ef7a8b3181782d7673aab5124e123a1b2b0 +size 17303039 diff --git a/model.layers.24.self_attn.v_proj/data.pt b/model.layers.24.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b2079c8b1ed04d2deaaae61382e11c95e4c7b6c --- /dev/null +++ b/model.layers.24.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7375191b81d809538417430118737ce4a4a72c5572cbebef3c3accb892c2186 +size 4326911 diff --git a/model.layers.25.mlp.down_proj/data.pt b/model.layers.25.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..a16c213c70a39324e8eefcef645473e6c38c93b6 --- /dev/null +++ b/model.layers.25.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3051af47586f4902e1efd2845a5a04f5ae10ba75c3fe9d3790a4d178c86a9ca2 +size 60556799 diff --git a/model.layers.25.mlp.gate_proj/data.pt b/model.layers.25.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2de8e8b90c226a5bc7e8ff3b7f116959c6640ea --- /dev/null +++ b/model.layers.25.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66ed007f106102fa1ce8b737b6c7dea0ccb7dcf507fdf5cd014b35cc83e9b217 +size 60556799 diff --git a/model.layers.25.mlp.up_proj/data.pt b/model.layers.25.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..3faf75163509d3f334f4679a999ae23dde34d5d4 --- /dev/null +++ b/model.layers.25.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:192e049261ad8e1ed58b16df6d333d14fb7bad61d7301adf3f05cff48ad95842 +size 60556799 diff --git a/model.layers.25.self_attn.k_proj/data.pt b/model.layers.25.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4ac91a74fb8444329726316d8d9c38f76128f7c --- /dev/null +++ b/model.layers.25.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edced44a7cd3083d0b9d0830f5c5c11e49f647a92ad7c498bd15d139731b096e +size 4326911 diff --git a/model.layers.25.self_attn.o_proj/data.pt b/model.layers.25.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..50178e646fb4df5cdfd06a518017625332478d34 --- /dev/null +++ b/model.layers.25.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3aa3a694d20873509d46f1ff4112506e00d1eb2d7e3f9dfbaa88ca4b7474207 +size 17303039 diff --git a/model.layers.25.self_attn.q_proj/data.pt b/model.layers.25.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..08c8af3254775a7e612918f8b3496574891c5a67 --- /dev/null +++ b/model.layers.25.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af97a7dab264967951180bedf1333d69a6781a06f404fb018000201558807eb4 +size 17303039 diff --git a/model.layers.25.self_attn.v_proj/data.pt b/model.layers.25.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a5b6db32c30b61b05f196a911af34bd31ff6d40 --- /dev/null +++ b/model.layers.25.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65eecaf23b96dee92471bc1d1b91da49e542cefffa32d48f025d7c261e2fb582 +size 4326911 diff --git a/model.layers.26.mlp.down_proj/data.pt b/model.layers.26.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..53bb76ff15f8374701014868ee39d91c0364257f --- /dev/null +++ b/model.layers.26.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98d8c1e0332c54cca6ac349b02b19d7face68c1733077ba7ebe72a29d6a2b161 +size 60556799 diff --git a/model.layers.26.mlp.gate_proj/data.pt b/model.layers.26.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f69d3acd761fed13f43cf77dbfc76bd6d2202cd --- /dev/null +++ b/model.layers.26.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:808e5594bcf056c0196b7a684f893c76e4be6f5a630d2760e1a9efceed65878d +size 60556799 diff --git a/model.layers.26.mlp.up_proj/data.pt b/model.layers.26.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..3460f2a35e5ab7ec49913d68555008b6ffd3e454 --- /dev/null +++ b/model.layers.26.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86623bd4dcaf3daa30bab1f9ffe644ee5ba74f2153dc77164ac590606307f432 +size 60556799 diff --git a/model.layers.26.self_attn.k_proj/data.pt b/model.layers.26.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..303b0a87c9ad08e211ff03b0d1680ea5b088b40e --- /dev/null +++ b/model.layers.26.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d7cbdf20d9f1a50320c6ee992ae0c43780586921b37c5bb6aff5b12bf9468c3 +size 4326911 diff --git a/model.layers.26.self_attn.o_proj/data.pt b/model.layers.26.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..083a5ed1d7d5d9fe3fb694d45db9f62f93b730a9 --- /dev/null +++ b/model.layers.26.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ced9eed764ddd5c345cc227a5a024b37c26141108121ca711c8351b64b43ced +size 17303039 diff --git a/model.layers.26.self_attn.q_proj/data.pt b/model.layers.26.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bcbc17e86add15ccb301869859ab695437cffb1 --- /dev/null +++ b/model.layers.26.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f27371418d03c401c28201876c203c96294dddd9faee11febefc278bbd95bf7 +size 17303039 diff --git a/model.layers.26.self_attn.v_proj/data.pt b/model.layers.26.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..be1a446e4113cc4c8dfb41d3e56e89eefb9bf074 --- /dev/null +++ b/model.layers.26.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d986f40eba96b059342d02e66e584db931904d22a75c09f60de2f2084e9ea667 +size 4326911 diff --git a/model.layers.27.mlp.down_proj/data.pt b/model.layers.27.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..053b1188856e154f412d733687abedd098e74331 --- /dev/null +++ b/model.layers.27.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0060ca57458420876b16b16656b2e852dfd1cf99013ec42e61c76a704e6077e2 +size 60556799 diff --git a/model.layers.27.mlp.gate_proj/data.pt b/model.layers.27.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c85d3d090a09e59e0e581d7890715488f743ae1 --- /dev/null +++ b/model.layers.27.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abbd49d9cec2b08858d8f285d36a07209e86fe9ed8a87ec559cfd3295e9b87b1 +size 60556799 diff --git a/model.layers.27.mlp.up_proj/data.pt b/model.layers.27.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fa7789e86e598590c999c31f6c2da83e7701b44 --- /dev/null +++ b/model.layers.27.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c88da6d64932feef2c6be8e3fc00c0801d035be2b95178bf5a324f97f0d31f7 +size 60556799 diff --git a/model.layers.27.self_attn.k_proj/data.pt b/model.layers.27.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd832357fc27c81401c4649f71665861be412c47 --- /dev/null +++ b/model.layers.27.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9abb8e09ff5f89f58233c54e789fb86d6f0e459612510cb7ac48402e81ad95f +size 4326911 diff --git a/model.layers.27.self_attn.o_proj/data.pt b/model.layers.27.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..40153700478e55271ac603beb149045178cb8516 --- /dev/null +++ b/model.layers.27.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:282daba4a0bc069c1213b0f9b52278bc87d7b242fca72204059ab98857ff4cc4 +size 17303039 diff --git a/model.layers.27.self_attn.q_proj/data.pt b/model.layers.27.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ffff438b496409aa2179366cf2af35ff835734f --- /dev/null +++ b/model.layers.27.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d43de53626e3bd178fea0dbc594a57f271bfe26c1abbb74dc6acbca0e76edee0 +size 17303039 diff --git a/model.layers.27.self_attn.v_proj/data.pt b/model.layers.27.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d8e700b9d91dca124da6b7703f63963ddc9b923 --- /dev/null +++ b/model.layers.27.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d78657e2a455dbe6c9cb57ec2c491952125781bbe8bd77ee7f01ab77fc941b09 +size 4326911 diff --git a/model.layers.28.mlp.down_proj/data.pt b/model.layers.28.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7758fd1b950cdb5418dc5e675dd442c14d757e8 --- /dev/null +++ b/model.layers.28.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2b627af95d78e9441367c2cf681d7ca45bb183c39262fbf4ab869a7b21d17d8 +size 60556799 diff --git a/model.layers.28.mlp.gate_proj/data.pt b/model.layers.28.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..64f24f39d282030b1a444798066b1acd9596c50f --- /dev/null +++ b/model.layers.28.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8988e0d32a0706dc3a7528bcc27299ebdb049c5486d8c54ce06503179637c35 +size 60556799 diff --git a/model.layers.28.mlp.up_proj/data.pt b/model.layers.28.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd1df096982e6f50f45f1f41b95a8967ef28f239 --- /dev/null +++ b/model.layers.28.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a5425bb977ccee6519f9ca41174ee483a591990a760d263c7e83d70591f79e8 +size 60556799 diff --git a/model.layers.28.self_attn.k_proj/data.pt b/model.layers.28.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1ee4362ee69f336a14e14ed768822fd57992c4c --- /dev/null +++ b/model.layers.28.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b6714c905d7e2471176dece415feab5dd0fb66011b518a1ceca2240dfc35b00 +size 4326911 diff --git a/model.layers.28.self_attn.o_proj/data.pt b/model.layers.28.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d4452a9d609d7c04789cbd22f6bf3fea8b02fcb --- /dev/null +++ b/model.layers.28.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b84f33bc3d5e19f61417e95704675e070f5c1a7e5d05e8b35981f6937f9920c +size 17303039 diff --git a/model.layers.28.self_attn.q_proj/data.pt b/model.layers.28.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f2abf11a9e9b3139460156c24e0a7d1ebb344a5 --- /dev/null +++ b/model.layers.28.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd90e815955caa013185f4bee31eb81bfb6d0a45e804a3f7ba1aa79de399de02 +size 17303039 diff --git a/model.layers.28.self_attn.v_proj/data.pt b/model.layers.28.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fe62b12484e68f2e1a75c07d6e6f2621b435710 --- /dev/null +++ b/model.layers.28.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a62f90b85a468be5f4ad05b734951592115f680715490815e95830a62b668746 +size 4326911 diff --git a/model.layers.29.mlp.down_proj/data.pt b/model.layers.29.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..95551b1fe966bda5acfe93b9503804a19bb1ac10 --- /dev/null +++ b/model.layers.29.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:037fed3ceff38d76855578ab7de8118b48e5d346d101f6837c3ded08a1bb4f4a +size 60556799 diff --git a/model.layers.29.mlp.gate_proj/data.pt b/model.layers.29.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b80c783d96b20e98391e5f44e773dcf205a3b1b --- /dev/null +++ b/model.layers.29.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22937f04e7503dd2577d331efc0158c6b140e8c9752074a24e55201c0947efa1 +size 60556799 diff --git a/model.layers.29.mlp.up_proj/data.pt b/model.layers.29.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc6e88b60b0b85ddf8a0519e93ca43f7e988cb14 --- /dev/null +++ b/model.layers.29.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:955440264b0a72673c21f6ddf118e0b25c02e0b0b2d76300e6e1f408b18a296c +size 60556799 diff --git a/model.layers.29.self_attn.k_proj/data.pt b/model.layers.29.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..71b6a053f4b506df10f42fd40e6d7b848c960812 --- /dev/null +++ b/model.layers.29.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adb4535d514554fcbea30897722f9dd9723780c11c657c7dd8689c8b05143bb4 +size 4326911 diff --git a/model.layers.29.self_attn.o_proj/data.pt b/model.layers.29.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..e53e403cc86afd2367d1591306fdf77ff7432baa --- /dev/null +++ b/model.layers.29.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31242110d7274e77f3404868a24cf8bc37127c5a74868f3c4369f9a88ca4673e +size 17303039 diff --git a/model.layers.29.self_attn.q_proj/data.pt b/model.layers.29.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef1b641a54587710a2e9ba1c70aa069490980365 --- /dev/null +++ b/model.layers.29.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14aaaeb888801e68fccf35b279ff494c256f04593eb5c1534ac878ac29f26c36 +size 17303039 diff --git a/model.layers.29.self_attn.v_proj/data.pt b/model.layers.29.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c596f81e44c524f99b2f7f49b43f41a3393cacd --- /dev/null +++ b/model.layers.29.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80675eb0111cd6bc27f90485803dde6808f962ee6ecc7d2e058ed654a9ce89fa +size 4326911 diff --git a/model.layers.3.mlp.down_proj/data.pt b/model.layers.3.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e9057080db9959f7eb121988a3d232466cb3c03 --- /dev/null +++ b/model.layers.3.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afe16228c3ec82d89b63a40251a99e86081d2d4a52a13664a9d9d97bbd8a5766 +size 60556799 diff --git a/model.layers.3.mlp.gate_proj/data.pt b/model.layers.3.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8ff5a5e2d9719e9023cbeda71d1913ffbaff6c1 --- /dev/null +++ b/model.layers.3.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:780677869d4a11794dbeeaaaf76319cd27893745fb7bc080e7c4a4f74783da1f +size 60556799 diff --git a/model.layers.3.mlp.up_proj/data.pt b/model.layers.3.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bdecf5346fe6c96163a5fc21d6189850f63fbc2 --- /dev/null +++ b/model.layers.3.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e378fba7bbaeedc77d45c4e312ecd19cd6445fe2fd3c97a213238e7cbca29731 +size 60556799 diff --git a/model.layers.3.self_attn.k_proj/data.pt b/model.layers.3.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4ba52f1778732fa5c9dd90c18c0f3fd8f44d5f9 --- /dev/null +++ b/model.layers.3.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd6f600bec336dc03288421e2f100471ca46b9824626f373a764e1051e7c7090 +size 4326911 diff --git a/model.layers.3.self_attn.o_proj/data.pt b/model.layers.3.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4545275d4b3793c522e2aa751dd8d575ebfa157 --- /dev/null +++ b/model.layers.3.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fa1cdd421c3323b742045a67307de59ec80c2ddb75cd69471e0e358ea5dc73a +size 17303039 diff --git a/model.layers.3.self_attn.q_proj/data.pt b/model.layers.3.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..454d6dedb3ed1ce5cbb0cdd2a5251643707ca5b6 --- /dev/null +++ b/model.layers.3.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8b30f0bc21ebca6abce501f781f9cbd2e86da0ba4e61ed2893ba4db9c3d19a2 +size 17303039 diff --git a/model.layers.3.self_attn.v_proj/data.pt b/model.layers.3.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a943273a3bcc5588299f4f720143cbe217c80ae --- /dev/null +++ b/model.layers.3.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b67876b1bde977605bf342fa871e58af26e3d585bfcdc5eaad0af117e38a2c49 +size 4326911 diff --git a/model.layers.30.mlp.down_proj/data.pt b/model.layers.30.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd9791f947e08324c216b8544b3b45a2c6bc5272 --- /dev/null +++ b/model.layers.30.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a635079c1edf7da8eff8ecc961d8e4706f206ab50ddd2ca2472c9063ad488c17 +size 60556799 diff --git a/model.layers.30.mlp.gate_proj/data.pt b/model.layers.30.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc6ee18a88b28ae648ea25564c25c7eebd890a08 --- /dev/null +++ b/model.layers.30.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ffdc24579bbecbdcce255eb957fd13d17ae44dc08a1c1a5f5827f8367510066 +size 60556799 diff --git a/model.layers.30.mlp.up_proj/data.pt b/model.layers.30.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..7239d35e5931e25716f785c7d7ad8b3950b86d02 --- /dev/null +++ b/model.layers.30.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6310af82625ff1bf572abd54610b650e37781ca4f105d99e9400060ea38ebcfd +size 60556799 diff --git a/model.layers.30.self_attn.k_proj/data.pt b/model.layers.30.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c5e144eb24dda4e9d276125b0743a63fc9c9e2c --- /dev/null +++ b/model.layers.30.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2ce57119526b11b33c14296095bf6547f16517daba2293f0f9b177c6789b53c +size 4326911 diff --git a/model.layers.30.self_attn.o_proj/data.pt b/model.layers.30.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8c6affea21565de812e7d7c088d84bec89d0c4b --- /dev/null +++ b/model.layers.30.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4915efac9effc571f71e2c033fcdb9c1aa5413626669c2a86b28742d142501b6 +size 17303039 diff --git a/model.layers.30.self_attn.q_proj/data.pt b/model.layers.30.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1bd3cc83684144657b80a68d59fa9a47f774e74 --- /dev/null +++ b/model.layers.30.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16783722c480313e61bfc52c6abf95f17c19f5b61fe2dcc90961b7e121f97ad7 +size 17303039 diff --git a/model.layers.30.self_attn.v_proj/data.pt b/model.layers.30.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..10470ef4321959743147fc3d3dd50b915af9e1d2 --- /dev/null +++ b/model.layers.30.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b902e579dddfae13d9f4f6e1937c14d912cf0f96b4521968ea6a2725831799ad +size 4326911 diff --git a/model.layers.31.mlp.down_proj/data.pt b/model.layers.31.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a2ec58cfc92fe3d2424208d1198276d9a7660a4 --- /dev/null +++ b/model.layers.31.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b0e5b1e2dc8256184238294a50da9e1aec7e666ccb43d7a2bad12dc6a50af85 +size 60556799 diff --git a/model.layers.31.mlp.gate_proj/data.pt b/model.layers.31.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bc934bfa0a6795c911e01f76e977fafc5afc6a6 --- /dev/null +++ b/model.layers.31.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dac2f49df47ade80ce1de17827597d9e130635400fadb58ea9721a8c1432f9a +size 60556799 diff --git a/model.layers.31.mlp.up_proj/data.pt b/model.layers.31.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b059cd3b828c76005b156da41261adb8b8b5f00 --- /dev/null +++ b/model.layers.31.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbc781e48433621231e85908e248261e2c52d2808b03af4b1d3517587be467c9 +size 60556799 diff --git a/model.layers.31.self_attn.k_proj/data.pt b/model.layers.31.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..42710123f372da9dedf7b1f79cda6986b35e7f57 --- /dev/null +++ b/model.layers.31.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:555069524b705f80cbae55074458660f9493f85bb48a2d54fdc251ab6e14e89a +size 4326911 diff --git a/model.layers.31.self_attn.o_proj/data.pt b/model.layers.31.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..81226461b8360dda60452afc6db63c42bce2bb34 --- /dev/null +++ b/model.layers.31.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43b277272995c8c728130e1ad8b0ae2bef6b070d4002014c10abe79d2be45185 +size 17303039 diff --git a/model.layers.31.self_attn.q_proj/data.pt b/model.layers.31.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..a150df69974a455d488ce75047e74835e3ed3b93 --- /dev/null +++ b/model.layers.31.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd299b41368c6ff94df4e92195839472ed46ae5141eb4a9fb5cf4077e4ef2fd9 +size 17303039 diff --git a/model.layers.31.self_attn.v_proj/data.pt b/model.layers.31.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..7352ea8f98df1e5adb93269d5abec37a9328b84c --- /dev/null +++ b/model.layers.31.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c51261cbf1dcabe814b35ef05a89235a0d059843352da0b519f362353e479a8b +size 4326911 diff --git a/model.layers.4.mlp.down_proj/data.pt b/model.layers.4.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..0207e55a698ce368941e9ada692a1e47631ded8f --- /dev/null +++ b/model.layers.4.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e523559c565e18aca7650c4ce53433c3e91879ecfd6b81267468a1c13a2cbcea +size 60556799 diff --git a/model.layers.4.mlp.gate_proj/data.pt b/model.layers.4.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..b844277bb0c89424cf5fcdb33a5b06b13a3d95cc --- /dev/null +++ b/model.layers.4.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a26833f2ad94c8f0e8c0691408f616d83b476b0fb17ba2aa35a7c16b72ccb382 +size 60556799 diff --git a/model.layers.4.mlp.up_proj/data.pt b/model.layers.4.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..92cf37f1b7f5e5197401b7a026d581a7ddd17aaf --- /dev/null +++ b/model.layers.4.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c61c76906aa1cc810309ca2161d94d3a0877a6bc213152ee49806b877f3a6813 +size 60556799 diff --git a/model.layers.4.self_attn.k_proj/data.pt b/model.layers.4.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b94823db582fa4afb601ec6cc41a6bc9e0adc15 --- /dev/null +++ b/model.layers.4.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:782aa90fb1d713713102af3c51d059dba9839e6e0433c15a30f0ea945ccc6f0d +size 4326911 diff --git a/model.layers.4.self_attn.o_proj/data.pt b/model.layers.4.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..d68cfbe5b08450c3efd53942631d99bc07bb920c --- /dev/null +++ b/model.layers.4.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08c0a67567cd7dd61559186bc9e6da0b1370e6ac129a0d089193e3b68fee0260 +size 17303039 diff --git a/model.layers.4.self_attn.q_proj/data.pt b/model.layers.4.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a232cb126f1ef737e1f91a09c164afcbfadb51a --- /dev/null +++ b/model.layers.4.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c85290228664964552f883af0fd7175b45c85818c258b6f76c4b3b7af305a0f +size 17303039 diff --git a/model.layers.4.self_attn.v_proj/data.pt b/model.layers.4.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfbcd6aced348bc4da346861c9e5e89df0148b0a --- /dev/null +++ b/model.layers.4.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1424e363061df00624e0a7dc58f3f7824d316af5edcf9af7a5b14a9641520b7b +size 4326911 diff --git a/model.layers.5.mlp.down_proj/data.pt b/model.layers.5.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..27dd787f60a9d47e07756eae839942294b78aaaa --- /dev/null +++ b/model.layers.5.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e858740555f724113f350f9d0637997051489e99ff9be0e88a9ac107a6ac173f +size 60556799 diff --git a/model.layers.5.mlp.gate_proj/data.pt b/model.layers.5.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f53e366eafdc5803c8da42ab6f8a4f40b140679 --- /dev/null +++ b/model.layers.5.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92321b583f891f032e4da26fafd0fc2626b5a04e860f1fabe9fc79b26014ed3a +size 60556799 diff --git a/model.layers.5.mlp.up_proj/data.pt b/model.layers.5.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9feafed5396dc7efaf182d3eaa665f91e3dd22e --- /dev/null +++ b/model.layers.5.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e0aff8061e0910047a5879cd57a04c9ee4a88847cfe7f5235d563d3552f73fa +size 60556799 diff --git a/model.layers.5.self_attn.k_proj/data.pt b/model.layers.5.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..a974d5797e57fdc06de759d2585cc108bb252eb0 --- /dev/null +++ b/model.layers.5.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6013f65ceb16dfc5f5309590021f125b0566b9ea5c9a733927429d93b36c4a1a +size 4326911 diff --git a/model.layers.5.self_attn.o_proj/data.pt b/model.layers.5.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..aabefb0a58a0d3179503ed3bb3be8ccdcfefeb26 --- /dev/null +++ b/model.layers.5.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2988bcf18715d556dcfdbda3220f623e252195bbfe3b49d2aeb92f4a3da7cb3 +size 17303039 diff --git a/model.layers.5.self_attn.q_proj/data.pt b/model.layers.5.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..efed13c7d0601c47c24507d62ea07a29f37c3b64 --- /dev/null +++ b/model.layers.5.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d6ecbcc16a037b81c5d3c4f5d7c490e8f5c0dd45c8b4c9ec7fa08553f19aa6e +size 17303039 diff --git a/model.layers.5.self_attn.v_proj/data.pt b/model.layers.5.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..60cf90839eabed790f6ddbd07042260c9d9026ed --- /dev/null +++ b/model.layers.5.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccb3d85ba7274bbb461e5db2c6aa3312c10b3a029d3bfd957510613fbf843d7d +size 4326911 diff --git a/model.layers.6.mlp.down_proj/data.pt b/model.layers.6.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..63c0dbeb54388d0052f2ff28412a6e12b36ad4c9 --- /dev/null +++ b/model.layers.6.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e54209d3114d731c13d50bbf3359987d759da52255828c29f7b5cd61340d101c +size 60556799 diff --git a/model.layers.6.mlp.gate_proj/data.pt b/model.layers.6.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..d75c9158573894540d22bf5a72d00008adac080e --- /dev/null +++ b/model.layers.6.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:740472bc8b4b7e03c49a5f2c0e5675ede17ef9451e582c6c8cf1b6bc93ef574e +size 60556799 diff --git a/model.layers.6.mlp.up_proj/data.pt b/model.layers.6.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..7538b8de5fb8edec7d3a399a167aa268250c346e --- /dev/null +++ b/model.layers.6.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3d6e4fc0f2f18933fb0173dae8194ceab82b1783bb518c1d09487364d199552 +size 60556799 diff --git a/model.layers.6.self_attn.k_proj/data.pt b/model.layers.6.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..9dfe788f3dd719d3b93d90d7360c44057c2503d3 --- /dev/null +++ b/model.layers.6.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e59ae11d23e8c25837a48fbcb6fd65f043cf34d8397f2089454ebffc8940eac8 +size 4326911 diff --git a/model.layers.6.self_attn.o_proj/data.pt b/model.layers.6.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..53645ca08c3ae31b054caacfb77331e4d6e330ba --- /dev/null +++ b/model.layers.6.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08264e3daf4a27f72728fe84eedf3b73e9493ebeaeb71ab58bc56431a27e8837 +size 17303039 diff --git a/model.layers.6.self_attn.q_proj/data.pt b/model.layers.6.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..637fed17ca48a963e900d8823384521db620b683 --- /dev/null +++ b/model.layers.6.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcfded2e9b70d4c16594fdcddb03d12b5b1260388ce5d5ff43e34257fc69ac3c +size 17303039 diff --git a/model.layers.6.self_attn.v_proj/data.pt b/model.layers.6.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..f89649dfe6dc9a469bcf40dcffe6b9a171bd5903 --- /dev/null +++ b/model.layers.6.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73d39b7a5dd0a2510e47d01bacaa85038bf1203646cd3b26c587182fb4a390c1 +size 4326911 diff --git a/model.layers.7.mlp.down_proj/data.pt b/model.layers.7.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..37d1b7c164237b8ca32334fb966a0981053e78b4 --- /dev/null +++ b/model.layers.7.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13c4cf230565d4a180b6d923a9ad780da28d3e19e23fe230c305f8f70ea9a1d0 +size 60556799 diff --git a/model.layers.7.mlp.gate_proj/data.pt b/model.layers.7.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dc31ad335eb6abdb4ce0a550dba50e4ab3ba140 --- /dev/null +++ b/model.layers.7.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8552f1fdae9cdf38dfce196302412d59b7fb03f4ce2dd117770d6bfa21b1045 +size 60556799 diff --git a/model.layers.7.mlp.up_proj/data.pt b/model.layers.7.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..330a066c542dca1b057643549b6df0294c482598 --- /dev/null +++ b/model.layers.7.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afa7f648ed0b349f0ab2a04406e59c052e4ef647eda6cd2aded295a8650b2660 +size 60556799 diff --git a/model.layers.7.self_attn.k_proj/data.pt b/model.layers.7.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..f937977733ab5ca98717262eebba68f9db95a014 --- /dev/null +++ b/model.layers.7.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fb04bd1f9a77e25f907d890154f0b735953234b7202873a02a083d3d57108d6 +size 4326911 diff --git a/model.layers.7.self_attn.o_proj/data.pt b/model.layers.7.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..a74c0e0cdd429caed2bf23baef1b3e2997d54d31 --- /dev/null +++ b/model.layers.7.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba1e16bc7938f370fbea1772d492cef07189ebeb82fdc1282ec8cd1bb4e435a6 +size 17303039 diff --git a/model.layers.7.self_attn.q_proj/data.pt b/model.layers.7.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9369df0d82bde74974a29d1480cf5ae9a94a309 --- /dev/null +++ b/model.layers.7.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5270d1f0eaf5ebe5a249aadb5fe2a6176c9e7a1f43a305fde7f1d793a404a4d +size 17303039 diff --git a/model.layers.7.self_attn.v_proj/data.pt b/model.layers.7.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..5126a1d9dbfa5860f97563a8bd2d3d0a9868ef15 --- /dev/null +++ b/model.layers.7.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6ce43dcc52df8dcc90dc53a1d26512e07b26bd5aef0984063bcb28061e545b9 +size 4326911 diff --git a/model.layers.8.mlp.down_proj/data.pt b/model.layers.8.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..9283a4bf380e45dd06ef2d61d4f5d90a3892709c --- /dev/null +++ b/model.layers.8.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5332d2501c83724808997c662a1f53e0da68f8f3b8a93d6ad2cbea5e5829838 +size 60556799 diff --git a/model.layers.8.mlp.gate_proj/data.pt b/model.layers.8.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..b594ea5e12a2b50117c52c731231b9f590ed8335 --- /dev/null +++ b/model.layers.8.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc34123d617fff1012db2829b1e855cce28b1cd39480d9e1ec02559663a7e1af +size 60556799 diff --git a/model.layers.8.mlp.up_proj/data.pt b/model.layers.8.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..90de3e7c7063672e307bb712f749e8772a1495d5 --- /dev/null +++ b/model.layers.8.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a677383fbce4f9610b071ea141a4089206c8b11580f70f0286a39f4fb8fcdc98 +size 60556799 diff --git a/model.layers.8.self_attn.k_proj/data.pt b/model.layers.8.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad193ce4ddc73eb7e3a8b8cd9538c42b6afe3ad0 --- /dev/null +++ b/model.layers.8.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c63d2829bb3498cf431a49c6de6582691289968c059614ae13670816b256e0d6 +size 4326911 diff --git a/model.layers.8.self_attn.o_proj/data.pt b/model.layers.8.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce12dfe6787042e68a8b72889f17ae619021a7de --- /dev/null +++ b/model.layers.8.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58065297051bd8f8ba081b7a533577030d9d336c1ef8287dcb3f3574a1eb3a2b +size 17303039 diff --git a/model.layers.8.self_attn.q_proj/data.pt b/model.layers.8.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..dee262cef85c81adb4844f290a1efd206445ac8d --- /dev/null +++ b/model.layers.8.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09f525107b8c2f5ca8db5c06010fe6f1c0bb20b7b7d2cf03cd1799c63ea79f03 +size 17303039 diff --git a/model.layers.8.self_attn.v_proj/data.pt b/model.layers.8.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..817912c2c29b47f74def738ae6c93895f7b7743b --- /dev/null +++ b/model.layers.8.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa571d0d8d9ca564246e6681f13d38f0954dc588fcca92fde427f7b66c99a4b9 +size 4326911 diff --git a/model.layers.9.mlp.down_proj/data.pt b/model.layers.9.mlp.down_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..34381ec05105b0fd03c83cba9407b19a67c0dd86 --- /dev/null +++ b/model.layers.9.mlp.down_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ba57400e79b352760685322ff6409cdfd245dab3320dcfc1fb8191460ed9643 +size 60556799 diff --git a/model.layers.9.mlp.gate_proj/data.pt b/model.layers.9.mlp.gate_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d0e66f4981130f1e626e948d0c69f233d4c64dd --- /dev/null +++ b/model.layers.9.mlp.gate_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fd9ff0d6c3f2600f1b74457d458f178709e8036d75990ea550b7c53d8c852ed +size 60556799 diff --git a/model.layers.9.mlp.up_proj/data.pt b/model.layers.9.mlp.up_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..e83e6424abc8f73df25792d0af013889a920eaa6 --- /dev/null +++ b/model.layers.9.mlp.up_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d60d3752add9ee75a171b95d5b964a2ea27e750d9bcd3f3aa1bda8e54d6f4146 +size 60556799 diff --git a/model.layers.9.self_attn.k_proj/data.pt b/model.layers.9.self_attn.k_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..82db1af42eb5bfd7cb2e51f12d9482d09d9723e7 --- /dev/null +++ b/model.layers.9.self_attn.k_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79d87e36e857220f08b1953286ef755923d0156e41faec61f70d669cf2088315 +size 4326911 diff --git a/model.layers.9.self_attn.o_proj/data.pt b/model.layers.9.self_attn.o_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e0a2c2217a855eec9b5c9f06354b26baaf53cfd --- /dev/null +++ b/model.layers.9.self_attn.o_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:431d2aefbe1344bea0ba913a04bbeefbf867afc6bbb562b906c47e3747a1b1fd +size 17303039 diff --git a/model.layers.9.self_attn.q_proj/data.pt b/model.layers.9.self_attn.q_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..1188f7430df14d8f5a45bf91a0c8c095bbee8db5 --- /dev/null +++ b/model.layers.9.self_attn.q_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdaa5d516fe46bca97836eb566cab6fd1d8bec4beb1eee17741b6e31eb18e413 +size 17303039 diff --git a/model.layers.9.self_attn.v_proj/data.pt b/model.layers.9.self_attn.v_proj/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8b12fb562b226536400635f7b396ef083efd60d --- /dev/null +++ b/model.layers.9.self_attn.v_proj/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92529d9075451a4ec277146d4b9350286f1ca6ad031f83ccb77e61a58e2468eb +size 4326911