diff --git a/checkpoints/comma/model/decoder/0/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/0/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6491de0d0ff9f671f5ad262230379928e85cc71b --- /dev/null +++ b/checkpoints/comma/model/decoder/0/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:748fa192c998c3ee4bdbf22c2107c4478cca6f1801bf9fa0ef165c62b4b2fcc1 +size 8388848 diff --git a/checkpoints/comma/model/decoder/0/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/0/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e78a58864a26df142502c8f25eb91f61d5323f9d --- /dev/null +++ b/checkpoints/comma/model/decoder/0/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdeaddd631a332791660f25c4a4ca5ad57d323f11b81380d830563b184777bcc +size 25166176 diff --git a/checkpoints/comma/model/decoder/0/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/0/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..befa07cb22aeb3a5b86f196f0866a386bd21aa70 --- /dev/null +++ b/checkpoints/comma/model/decoder/0/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a29e6f52e8f77dddb10a31eba77d8f650e890730eb527b2ccda98bc5fb049bf +size 4192 diff --git a/checkpoints/comma/model/decoder/0/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/0/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..738dd6e457e26a732a0476b3a750ed4fd6c75c8c --- /dev/null +++ b/checkpoints/comma/model/decoder/0/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e4ca278098764cd17064296b5fb71e065380c32a35da54f2c97499f162120fc +size 33554672 diff --git a/checkpoints/comma/model/decoder/0/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/0/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..42aea8858145a93e56c2534662cb30e09f752198 --- /dev/null +++ b/checkpoints/comma/model/decoder/0/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab5b2e95abb0e3878f2a76c89de2f4e23bcd76a8290aa554635ca651464910b6 +size 67109160 diff --git a/checkpoints/comma/model/decoder/0/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/0/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4fd1de939ef74ceebeb5b94f9e31f7764d2079a4 --- /dev/null +++ b/checkpoints/comma/model/decoder/0/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfd0b8fff3fbd3655e34f3bef60ea2fbf4771531090d158d28e7d248cc860627 +size 4192 diff --git a/checkpoints/comma/model/decoder/1/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/1/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4e3fd7b6a8a2aeffee9c6d8d286476c2fada6d02 --- /dev/null +++ b/checkpoints/comma/model/decoder/1/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d71483746720b042d1d6d21c5acb2a47fd0612ae88bef6007c41447b96256302 +size 8388848 diff --git a/checkpoints/comma/model/decoder/1/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/1/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3004e217a2ab29d7910bc1aa0f653668323359e2 --- /dev/null +++ b/checkpoints/comma/model/decoder/1/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f54d9b1ed225f1c6569c37790d5b397c625659bacf201509c28b5de5ea5b0368 +size 25166176 diff --git a/checkpoints/comma/model/decoder/1/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/1/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b9da8bd57a196aac1759ae861fe0fa2f632509e3 --- /dev/null +++ b/checkpoints/comma/model/decoder/1/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eab918e008207025a9d6c71b170bcc2f176f7b7af0822a0e5161e0dd0972a662 +size 4192 diff --git a/checkpoints/comma/model/decoder/1/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/1/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..764a35f2c1a260362ebc6f4c62df71b8962d6a2a --- /dev/null +++ b/checkpoints/comma/model/decoder/1/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6860751d0485ffbb527620d1c56042d94d6395c42a6cf0be2773519f11a47280 +size 33554672 diff --git a/checkpoints/comma/model/decoder/1/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/1/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c6bd25b3de319ff9b11b4d8bcd205ba1beafac68 --- /dev/null +++ b/checkpoints/comma/model/decoder/1/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a71db5192fe3e883f197182b264e7f373f9aa377638aa4efb0056d43e68f39e +size 67109160 diff --git a/checkpoints/comma/model/decoder/1/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/1/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7369138293c57da1ed916cc7b84201bf57fc51ab --- /dev/null +++ b/checkpoints/comma/model/decoder/1/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a585bcf0958a367775708fb0993e77f27f78db788a1a9db7f64b40220092524 +size 4192 diff --git a/checkpoints/comma/model/decoder/10/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/10/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a7aca37414dcf6774964c96bb2ccbea8189531eb --- /dev/null +++ b/checkpoints/comma/model/decoder/10/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27362ea8ac1e268cc9380e95398b4fd74be2718d5a0878013b9b4150e643fe6e +size 8388848 diff --git a/checkpoints/comma/model/decoder/10/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/10/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..acae3f9cc7a4f8331159b5577df7d579986fe6ff --- /dev/null +++ b/checkpoints/comma/model/decoder/10/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bb1df834b00dc59f959aabc1a154f98167abf875e9c72fc5b5a80f9bdba8032 +size 25166176 diff --git a/checkpoints/comma/model/decoder/10/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/10/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..77157a6f8e2f7fb4443254c69daa83394084aac6 --- /dev/null +++ b/checkpoints/comma/model/decoder/10/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c70d1772d91b84d74b91fdf43e80743908bd144251927ef44c9189f520bc3ead +size 4192 diff --git a/checkpoints/comma/model/decoder/10/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/10/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6feb9eca0d11d6f5b8933382a7795b5050dfc37a --- /dev/null +++ b/checkpoints/comma/model/decoder/10/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea02d217c7666ee434bea9d7e0a49cdb9e5d1311772de43692916c38bffbdb +size 33554672 diff --git a/checkpoints/comma/model/decoder/10/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/10/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8d6e5ff4824ff5930e4cf07e9a940023f151318e --- /dev/null +++ b/checkpoints/comma/model/decoder/10/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c589dcfb875b1cd359c5c1933253b84b43fa22fccbf16aa1f6097b1e830f7b7 +size 67109160 diff --git a/checkpoints/comma/model/decoder/10/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/10/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d5453d359525da100befe7c6f42049b47c5262d6 --- /dev/null +++ b/checkpoints/comma/model/decoder/10/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21c71d560dccdda85b8f06a87d5d39aecb6e3800187a2ba145a9b1758716503e +size 4192 diff --git a/checkpoints/comma/model/decoder/11/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/11/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..43383a7c3417741a2c76d3e3da75560d60498369 --- /dev/null +++ b/checkpoints/comma/model/decoder/11/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65691d131b44948fa99f661e51e8656c89e0a1675671d3c1091f93fd38336b73 +size 8388848 diff --git a/checkpoints/comma/model/decoder/11/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/11/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..868e546eaca5667fa5f32f290cb2f0242dc9be00 --- /dev/null +++ b/checkpoints/comma/model/decoder/11/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:586b64b22a17c176e09e5a859166c68fe42e0841e720b8977e2ac3cc05dde523 +size 25166176 diff --git a/checkpoints/comma/model/decoder/11/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/11/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..240510bfa7067235ac7c087089a9cb8090de21fc --- /dev/null +++ b/checkpoints/comma/model/decoder/11/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12f151d79434d6d116c17da83cc832d6455f5d9126d0f1917f2acd07f4c0f396 +size 4192 diff --git a/checkpoints/comma/model/decoder/11/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/11/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..01d72e8b4128ec89fa90414d614805e9d3b3c1f8 --- /dev/null +++ b/checkpoints/comma/model/decoder/11/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2766b1452a74fa2e6ad2ed161da95f488ddc81b09feebb8f297dfe289e32d960 +size 33554672 diff --git a/checkpoints/comma/model/decoder/11/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/11/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2495d5eaaf0dce23e208d1dd98a410e328170d67 --- /dev/null +++ b/checkpoints/comma/model/decoder/11/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6eeae92f3874c785306aee60e2486fc21bc8d560346baf2bb822316497a59566 +size 67109160 diff --git a/checkpoints/comma/model/decoder/11/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/11/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b7fdcce259f643b6ddd4872b74225ba6cc7a6fd5 --- /dev/null +++ b/checkpoints/comma/model/decoder/11/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77005f434a1feda713151810779c636aa4706e52f8acbbae3d0d140d0293618e +size 4192 diff --git a/checkpoints/comma/model/decoder/12/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/12/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1f237a22ce5f37eed0319498051ff1b359a43804 --- /dev/null +++ b/checkpoints/comma/model/decoder/12/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e104ef87be1450ed632ef74ebe62c004579530becbb5da258f066d04cf41810 +size 8388848 diff --git a/checkpoints/comma/model/decoder/12/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/12/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..abf1ff5a8a2b8f969b2a3cf889a3fad7dd1a53d5 --- /dev/null +++ b/checkpoints/comma/model/decoder/12/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0015c2d00b466af2a05f93af449ba71bdedfb020944e4514fb2728f1d8a34c42 +size 25166176 diff --git a/checkpoints/comma/model/decoder/12/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/12/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c68eea62bdf498867dbf5964d1d3f5633c60aafb --- /dev/null +++ b/checkpoints/comma/model/decoder/12/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56cd422219b6a372e0dca1d87446bff1be79e2f9070bc29bc284e8a4eb972b83 +size 4192 diff --git a/checkpoints/comma/model/decoder/12/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/12/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..20ff5c70052a6437ecca03301a1d9a5a5ae57fa7 --- /dev/null +++ b/checkpoints/comma/model/decoder/12/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee919f8f3631abac89be034a25e68e7903cb34f8c62b975a41a918ec0cc9cc64 +size 33554672 diff --git a/checkpoints/comma/model/decoder/12/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/12/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..335930d5f8aec0a317601874abc9286e52731304 --- /dev/null +++ b/checkpoints/comma/model/decoder/12/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:860f9a9155bbc2b353d534a5abadee968e88106db45ac5a01b66085abb347257 +size 67109160 diff --git a/checkpoints/comma/model/decoder/12/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/12/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd4502493aaa509ce73dceed9742f63589341fb3 --- /dev/null +++ b/checkpoints/comma/model/decoder/12/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50089da1be2172e67844fdd4bc04f914643e1c748e631e95385d479f5efd6e7e +size 4192 diff --git a/checkpoints/comma/model/decoder/13/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/13/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..374fb531f0d44f25889671b6936e5d2a6e8dd7d2 --- /dev/null +++ b/checkpoints/comma/model/decoder/13/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6680891f624935f92542182ecfb1d238be887b476747499abbbdced7cce37326 +size 8388848 diff --git a/checkpoints/comma/model/decoder/13/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/13/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..df45abb392a87434dbf873cff0c0fb9cf2c2b8d4 --- /dev/null +++ b/checkpoints/comma/model/decoder/13/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53f9f9d7a202f82339439bed5d6f053b69942fd89743c4d632671875217f0e6f +size 25166176 diff --git a/checkpoints/comma/model/decoder/13/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/13/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e3479af6175c635ffcf10cb8bc14756b015c09f3 --- /dev/null +++ b/checkpoints/comma/model/decoder/13/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb4fb830a2a958f8b7bd4329aa457c6e9b26d4a9b7467132a9b99049fdc1f7aa +size 4192 diff --git a/checkpoints/comma/model/decoder/13/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/13/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bdf242a969a10d251f0b3f9750d9e52d023d2632 --- /dev/null +++ b/checkpoints/comma/model/decoder/13/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54d4394323d320fbf1f8ed945548da79b09a3638762481f31fc2830d6bb3304b +size 33554672 diff --git a/checkpoints/comma/model/decoder/13/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/13/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..95c554cbddebb65ba3c736162d2db630176eac41 --- /dev/null +++ b/checkpoints/comma/model/decoder/13/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:099886bb00160ef6c69f514fff8e5b6777c6a53282343356961b70e6c846260f +size 67109160 diff --git a/checkpoints/comma/model/decoder/13/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/13/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..24ec99e8951f01ee74005ea344467ea87ad821df --- /dev/null +++ b/checkpoints/comma/model/decoder/13/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef776fc06112de765a2964e2096b31d325b9b3e9be978e1c44b7feb0ab4ff9db +size 4192 diff --git a/checkpoints/comma/model/decoder/14/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/14/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..62357de00dbc62655e5c8596753bb9ff1b613fcb --- /dev/null +++ b/checkpoints/comma/model/decoder/14/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59293e4746d0753f2bb5b4b0f9b388a48d66fd917de8caa84c2e9ac884f3b6a4 +size 8388848 diff --git a/checkpoints/comma/model/decoder/14/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/14/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2267e3bcd80d1edae1f0af9e6ab9c1c990558cf0 --- /dev/null +++ b/checkpoints/comma/model/decoder/14/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee7c2a9b259f85218e80b17eaa4720e4df29cfd1523cb73be042beba2f058e72 +size 25166176 diff --git a/checkpoints/comma/model/decoder/14/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/14/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..719be302a791ef8c4b74605d82310ca034706d18 --- /dev/null +++ b/checkpoints/comma/model/decoder/14/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dda319c945ff6944277d92bdc425dfb1fe955269c1dc01addac5c63def4a6b0 +size 4192 diff --git a/checkpoints/comma/model/decoder/14/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/14/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c8634b33d66ba65988e8da8cb9ef3c9bf9f1f2a8 --- /dev/null +++ b/checkpoints/comma/model/decoder/14/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:056bc63709d2e0fbb4d2475f3cb54e6a9145af515875281cdb5f62315e21ca32 +size 33554672 diff --git a/checkpoints/comma/model/decoder/14/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/14/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5b1deb351c9a6e35a523c594b3c8da71718454f4 --- /dev/null +++ b/checkpoints/comma/model/decoder/14/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e04bd43c4acaa3672a8474e7cdd1d2a5e6c00c20217514ebd5717fb9648be425 +size 67109160 diff --git a/checkpoints/comma/model/decoder/14/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/14/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e1409c42a03846ab252b573086400d8c41de0f6f --- /dev/null +++ b/checkpoints/comma/model/decoder/14/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f25dcdb0bb8163061cf356d9211cf2a18df0d333e24a0566f069aac0f137af26 +size 4192 diff --git a/checkpoints/comma/model/decoder/15/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/15/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0b7b003f0eb076f3f5235c796d90b3acbf296ac4 --- /dev/null +++ b/checkpoints/comma/model/decoder/15/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1252c9169764e401e800497c5dae87203b93b0301b1a56d5f6a33a9144d4d87 +size 8388848 diff --git a/checkpoints/comma/model/decoder/15/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/15/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..455c78276c3af51182c12b9822d4fb31586e57a1 --- /dev/null +++ b/checkpoints/comma/model/decoder/15/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e66a3d34b50994125960eed552ef6d7335718a8d65ab7887f0ecb95a6f9d1670 +size 25166176 diff --git a/checkpoints/comma/model/decoder/15/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/15/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3f1be10a324a5e1e9f9132b6fb70ffae37375474 --- /dev/null +++ b/checkpoints/comma/model/decoder/15/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25b0e5419edd2c6751181222e9072bd4c80eb8f2418a39f63df2a55ab83a6b29 +size 4192 diff --git a/checkpoints/comma/model/decoder/15/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/15/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c2fe51a903dda58edef91470b1001d707b902c71 --- /dev/null +++ b/checkpoints/comma/model/decoder/15/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20fd05ba9dc19076577eebc10cfb3c59d24e02d6638eb7158f47f9f13f8d9cd0 +size 33554672 diff --git a/checkpoints/comma/model/decoder/15/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/15/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5489acb099a939baec58621980161c4eaf7afb1b --- /dev/null +++ b/checkpoints/comma/model/decoder/15/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7870e1e2ef91714fdec2820b8b9f82b869cc5de6d7fa2de985335bceb6ded0b4 +size 67109160 diff --git a/checkpoints/comma/model/decoder/15/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/15/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..389d32f9133d4351cf166bfcb256ea92b5ae7af3 --- /dev/null +++ b/checkpoints/comma/model/decoder/15/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f795501d7da3080146067e7d598783fae743f4f55ac66056efc4cf9920d798d +size 4192 diff --git a/checkpoints/comma/model/decoder/16/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/16/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..22ff46013ba8821ab71e247323e33693e10ccf46 --- /dev/null +++ b/checkpoints/comma/model/decoder/16/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20a12b22754a35c1cb8915eb8d9dd3e509fe7584e2e8c384357d6e6c7b24280f +size 8388848 diff --git a/checkpoints/comma/model/decoder/16/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/16/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b5377e768098b2ab14120e1907a167809b42d59a --- /dev/null +++ b/checkpoints/comma/model/decoder/16/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76eb210d6708b1cb6e9036380d105646ab9d21b6f90784bb6899595d410c13cc +size 25166176 diff --git a/checkpoints/comma/model/decoder/16/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/16/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4de050b61127a58e6cf071eaab4a3b060b924e8b --- /dev/null +++ b/checkpoints/comma/model/decoder/16/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfce10502692992d9c50fff0b16e66f95d505a5408c6b114f9aaa865f72d396a +size 4192 diff --git a/checkpoints/comma/model/decoder/16/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/16/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ce2bcda74fcd4b71a2eabb9745959d4c4c6b0fbd --- /dev/null +++ b/checkpoints/comma/model/decoder/16/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac69aec11e564461f01af129ea4a6a147b9b2448898a50fee54e3cb23ebfc7ec +size 33554672 diff --git a/checkpoints/comma/model/decoder/16/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/16/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..14e51aed55e9b505edefd6e30a7827a6cec28fef --- /dev/null +++ b/checkpoints/comma/model/decoder/16/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a4484a2718afacca5dd4e9bb1d11d9d6d843d06ddaee81c898e018b28d50894 +size 67109160 diff --git a/checkpoints/comma/model/decoder/16/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/16/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..19dc8fbd5626f86f5d2f7ce87583c11fd82a34c8 --- /dev/null +++ b/checkpoints/comma/model/decoder/16/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80afc18acb82da852118e6500d4e7c53d50b5c53473ddf7c21a71c32b95cf8c4 +size 4192 diff --git a/checkpoints/comma/model/decoder/17/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/17/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..be70ba7206a45cce0e047befb9e10e5eff99900c --- /dev/null +++ b/checkpoints/comma/model/decoder/17/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2d6bee48cdcfef3712dadd1e0464c126c8c4c15a137e3f6a70ca4ac1157b77f +size 8388848 diff --git a/checkpoints/comma/model/decoder/17/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/17/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..39e65de6a5a83a741ed75f11c514dd62e82d88b6 --- /dev/null +++ b/checkpoints/comma/model/decoder/17/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:973bce5fba8214d40f1bd2c5a9c8e0e659cc2231ed00113b5437056d87d070c7 +size 25166176 diff --git a/checkpoints/comma/model/decoder/17/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/17/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..acf0c566f72eafddf6fc4ecd75c9dd2dc364bbe5 --- /dev/null +++ b/checkpoints/comma/model/decoder/17/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cee703ab9fb3dd5a71779116d0fd1ce408d934ae93819f68574824f2abd6b49d +size 4192 diff --git a/checkpoints/comma/model/decoder/17/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/17/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f7622678f18c969f55a962667bea73d48c03092f --- /dev/null +++ b/checkpoints/comma/model/decoder/17/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72f64ba53e3bc0764122b91f5287b3d572d09adf8dd551496fe41c7f52b01a6e +size 33554672 diff --git a/checkpoints/comma/model/decoder/17/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/17/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7ca813608b2f0a0151a1b466104bd7a48d95df55 --- /dev/null +++ b/checkpoints/comma/model/decoder/17/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad3b56dc15fdcc0a7ae3a524603ba80948b4dd171cfd88e7501a43a8aa7fe540 +size 67109160 diff --git a/checkpoints/comma/model/decoder/17/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/17/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bb1b104e5f75946d946c865e86f81f5a20b8d2a3 --- /dev/null +++ b/checkpoints/comma/model/decoder/17/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efd5e604af6338622b9e782f63a5f33433e94786755d0f2460483f973defd911 +size 4192 diff --git a/checkpoints/comma/model/decoder/18/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/18/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..331e0ee35e4392354435892f4be48363a0e8a204 --- /dev/null +++ b/checkpoints/comma/model/decoder/18/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e320261f88eb0b4376441bae3f995d346c826c6f4b1f5bfb156a35a2e41d1c40 +size 8388848 diff --git a/checkpoints/comma/model/decoder/18/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/18/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f3296c5a25b61e223571dff2c3c79ce51ddbad90 --- /dev/null +++ b/checkpoints/comma/model/decoder/18/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e228ec07a7cf9f37de0e00cb36c8c14fc35eaf6a4a853a84326c316ad3118b +size 25166176 diff --git a/checkpoints/comma/model/decoder/18/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/18/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a115cb81a9315aa3fe04eb2a772300ee47dec09a --- /dev/null +++ b/checkpoints/comma/model/decoder/18/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20fa7d3e1d63742d9a0b40f4b666193d9252434079668b0db28ded7201eed081 +size 4192 diff --git a/checkpoints/comma/model/decoder/18/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/18/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c4f347d4a11e72fe427a074c94e6817af67a2fd4 --- /dev/null +++ b/checkpoints/comma/model/decoder/18/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90826368729edd3bb6989ab24482097c2a576e67e0d5f30bfd0ce37f713a0973 +size 33554672 diff --git a/checkpoints/comma/model/decoder/18/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/18/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1dd47ce6c26aa2ca49617894ce6eb8d65ed72556 --- /dev/null +++ b/checkpoints/comma/model/decoder/18/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46cf564166e6fa3772d9a52e35321af46563a8eadb18d1b35e598f2acf01562b +size 67109160 diff --git a/checkpoints/comma/model/decoder/18/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/18/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..207a157320991604a2d9a9ae8e7f1e6a1fc2bf1b --- /dev/null +++ b/checkpoints/comma/model/decoder/18/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac38195f77d7a0b576a2568754efaf092d327fea7987d7fd9bb280e64f5ea410 +size 4192 diff --git a/checkpoints/comma/model/decoder/19/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/19/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1ee05b1d0cb7065c03548503d7c8718671b47764 --- /dev/null +++ b/checkpoints/comma/model/decoder/19/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99d31d636485e30ad25516a32fea38a22c148a17a685cb10ac7a85d06223d970 +size 8388848 diff --git a/checkpoints/comma/model/decoder/19/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/19/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e4c74c76937130409abf9d280242e47c90c19d32 --- /dev/null +++ b/checkpoints/comma/model/decoder/19/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6497bfe27154fb8cd5c2e642044bf60df66950d4901b853b40df34225a559b45 +size 25166176 diff --git a/checkpoints/comma/model/decoder/19/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/19/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..393fd195076cf58ccc6b902f29e55e5271261f8e --- /dev/null +++ b/checkpoints/comma/model/decoder/19/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a890468fa9d43cbe974f27c808b716c36a4b79dbad18ddd16e8e707e394da75e +size 4192 diff --git a/checkpoints/comma/model/decoder/19/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/19/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b7c62a83393f5463116b121467f18d5cee352276 --- /dev/null +++ b/checkpoints/comma/model/decoder/19/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:428a45b166d0ee15fc9dc9d3992754fe726bd0cfc6875398f37aff81b62e76a9 +size 33554672 diff --git a/checkpoints/comma/model/decoder/19/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/19/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..75d2f1e65e05c282975742d9830147c566eee237 --- /dev/null +++ b/checkpoints/comma/model/decoder/19/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:512850ef934599c3919aa1cfb52bf9b219dc2c1155743305805abc8eed173e19 +size 67109160 diff --git a/checkpoints/comma/model/decoder/19/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/19/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f569a1dd5979d93b24128bca59cfff68b44b6292 --- /dev/null +++ b/checkpoints/comma/model/decoder/19/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52657aa23116aefd24ba52be35131b7fea143b69f3d54fba3052a1aae0a9708f +size 4192 diff --git a/checkpoints/comma/model/decoder/2/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/2/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2412efebac460dec167c6db19dbadec238708752 --- /dev/null +++ b/checkpoints/comma/model/decoder/2/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a38805f7a89288a0f42d80264035c6b192015b1b9f7a4ad187841bbc68e62a0 +size 8388848 diff --git a/checkpoints/comma/model/decoder/2/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/2/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3d993631e723a01254a2b14c92a776535fd42759 --- /dev/null +++ b/checkpoints/comma/model/decoder/2/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5c3dc311b61963cd15dc578da2b2e12b77b675bf56b879b97e1806453bee51b +size 25166176 diff --git a/checkpoints/comma/model/decoder/2/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/2/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7ab5dbc55871f77cb383af08ff3f5876f11b3ecd --- /dev/null +++ b/checkpoints/comma/model/decoder/2/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c8bf39ff33547807eda85a2f3650938c52f607b18c51c8e45daeaa1b726e42e +size 4192 diff --git a/checkpoints/comma/model/decoder/2/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/2/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2a7c25d9855af028f5b75a9db6fc817073801e88 --- /dev/null +++ b/checkpoints/comma/model/decoder/2/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ed12c0ff7cf0bf6d4eaebeb0cb1f23d28ba556517fe5c1e8dc95503a4ecc217 +size 33554672 diff --git a/checkpoints/comma/model/decoder/2/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/2/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b187864b6bbe791ee8ffdccae85ba7cb2b2db9e8 --- /dev/null +++ b/checkpoints/comma/model/decoder/2/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e1b94b02ae59c1c9d200c0167cc21d28c831071a3f6598dc5ab7e9f496213e +size 67109160 diff --git a/checkpoints/comma/model/decoder/2/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/2/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5c24043f130e799279088bcd58389cb8fdcf4ab6 --- /dev/null +++ b/checkpoints/comma/model/decoder/2/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cd553a996431a19b85b5388c3cf3aa788f57f53755ce2d5f33a234232521987 +size 4192 diff --git a/checkpoints/comma/model/decoder/20/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/20/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2dc3bc7750c8b896ef6aa99457502c32b1edeb2e --- /dev/null +++ b/checkpoints/comma/model/decoder/20/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d0fb98b3b33592842da3e7de7524c7eda73607b2e63ae798159b726b36740f9 +size 8388848 diff --git a/checkpoints/comma/model/decoder/20/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/20/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f8d0311f06f92ace8ba80a913ea3dba817984384 --- /dev/null +++ b/checkpoints/comma/model/decoder/20/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe6cff413c86fdd90da3eacd4b898e0fbe2591ef1a6198d0eb0d0a7539565e93 +size 25166176 diff --git a/checkpoints/comma/model/decoder/20/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/20/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d2523ebef41c6ed1f02319704e3a15ec96f1f762 --- /dev/null +++ b/checkpoints/comma/model/decoder/20/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce641341a543ce25d7c20e172b236ff2b744f5d8eacf377cddd176f1d8c63546 +size 4192 diff --git a/checkpoints/comma/model/decoder/20/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/20/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c72829365919470d0c7f0ae5b6589e835d9e533e --- /dev/null +++ b/checkpoints/comma/model/decoder/20/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d90baa1aacae5ff8fadbfe699e330ca7cf12201ef61b5741d55ff00ab82cc0cb +size 33554672 diff --git a/checkpoints/comma/model/decoder/20/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/20/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..40b376a92b5d996dcf152525629e810b7ccd813c --- /dev/null +++ b/checkpoints/comma/model/decoder/20/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cae145f1fc12c16cddaf92d6ec64beb2f5461eb99c80898d9bd6e259acb9c58 +size 67109160 diff --git a/checkpoints/comma/model/decoder/20/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/20/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..15f486ba3c45c40b97abbc1acce675fa3389ba3c --- /dev/null +++ b/checkpoints/comma/model/decoder/20/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1762e20fe9ccdf0904862a11e0e305d613ff5510f050313dfcacf8e467ebba8e +size 4192 diff --git a/checkpoints/comma/model/decoder/21/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/21/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..09cbaa45a60f583e82dc2bd3fc5c706315687582 --- /dev/null +++ b/checkpoints/comma/model/decoder/21/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9298c7da80f585e918148d419d098291c1f8a78e26bea83d8aabe94038a23c7 +size 8388848 diff --git a/checkpoints/comma/model/decoder/21/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/21/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a371e004e4f1de4b2f0917c20763a53b7f1f4b9a --- /dev/null +++ b/checkpoints/comma/model/decoder/21/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2a50c6262f9a9820de8ab5a26251efad2f71027c399033d29354571cdd7075d +size 25166176 diff --git a/checkpoints/comma/model/decoder/21/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/21/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c0913b18c4f3e25b6d16e2cb1cc8f48946a85037 --- /dev/null +++ b/checkpoints/comma/model/decoder/21/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdd20673a52823b2553972063f65613f9099871fac5c4f7d4a3c4407495bd096 +size 4192 diff --git a/checkpoints/comma/model/decoder/21/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/21/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e07c0262002772c37e5c4f3fd3bc445da95bb3ad --- /dev/null +++ b/checkpoints/comma/model/decoder/21/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e8083de5ad076c31e5aea6310096f3b40217a51bb3566baf8b749f4e947378c +size 33554672 diff --git a/checkpoints/comma/model/decoder/21/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/21/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5d502c6d54781fb0386fb5a354d60d229e0eade5 --- /dev/null +++ b/checkpoints/comma/model/decoder/21/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd1b341f19420f3a0b544fe494791981e086c3add77d13f5f8d3d363f4c6d416 +size 67109160 diff --git a/checkpoints/comma/model/decoder/21/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/21/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..559f4cf20d6125f00900f4f2c7bf434b4b4b2e0d --- /dev/null +++ b/checkpoints/comma/model/decoder/21/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:560550aa7ed0e7fa06f32bf7708a4151d9038c93c9a56b80419b9a5bc2a037df +size 4192 diff --git a/checkpoints/comma/model/decoder/22/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/22/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f16dd030861d2148e32e1f522d66761c37497534 --- /dev/null +++ b/checkpoints/comma/model/decoder/22/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ab321d1a74be5f33af62c31014c99940baf6abe71ed58f3297d6d318ca80452 +size 8388848 diff --git a/checkpoints/comma/model/decoder/22/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/22/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..536cfdea9a80c5cb76017846122e7c9297236810 --- /dev/null +++ b/checkpoints/comma/model/decoder/22/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ed268a33a3d0cd004c03f7b2dd1c2c06a3c3e209265e53ca3ba872930237cdf +size 25166176 diff --git a/checkpoints/comma/model/decoder/22/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/22/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a0ed1a30ac632596a6d45e907b45093d9319d393 --- /dev/null +++ b/checkpoints/comma/model/decoder/22/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e7450adb04b1086d0c5fc1ea6ed1c66bcd58688516230e93851dc63fa20709b +size 4192 diff --git a/checkpoints/comma/model/decoder/22/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/22/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8f18dbe36499da4558166fb012302ff5733631b4 --- /dev/null +++ b/checkpoints/comma/model/decoder/22/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e608564a1ac71c4fc9aa374e4da428610cbf1865498149c38e15204fd295747b +size 33554672 diff --git a/checkpoints/comma/model/decoder/22/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/22/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8eed8e5a92c2cd9601fcaab291465feacb7f72dd --- /dev/null +++ b/checkpoints/comma/model/decoder/22/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de025c6806f98cf4e948f332ee1bc490bb508f85ef6570b45579f63ae88bd43f +size 67109160 diff --git a/checkpoints/comma/model/decoder/22/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/22/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4f84e0ebf4b815cbfb3bda04b10df4c8c679be09 --- /dev/null +++ b/checkpoints/comma/model/decoder/22/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c08061eceb639a76548cd9c6099e26b632ff57c84b4d3fd66c0513dbc6b8522e +size 4192 diff --git a/checkpoints/comma/model/decoder/23/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/23/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2f8b12b1ed0d1a0b716d341c500072d2fdd62531 --- /dev/null +++ b/checkpoints/comma/model/decoder/23/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32fa0b82a0af114b4fe60dd106bbbde85783f268b001f3f158fc4e805cda130e +size 8388848 diff --git a/checkpoints/comma/model/decoder/23/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/23/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..68c6d7590e4d15a9658d4ab0d04f834d21e1019b --- /dev/null +++ b/checkpoints/comma/model/decoder/23/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e04db29275f75fff74173ca058bdabd7871500df2c59a86250329eeec480454 +size 25166176 diff --git a/checkpoints/comma/model/decoder/23/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/23/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d5f60102cd6d6a9150e17ddad4e2c5ebb320ae46 --- /dev/null +++ b/checkpoints/comma/model/decoder/23/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:873d58c3b49587a978a68683837c58f67c8d48423b54d1806cc3630c3ec03161 +size 4192 diff --git a/checkpoints/comma/model/decoder/23/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/23/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..98dbb5a059c52f74dce4e5c79909147057846ef1 --- /dev/null +++ b/checkpoints/comma/model/decoder/23/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e78c0d6339a40ad0dec817bf13322b672cb483a87550b526a2d2bc810726898a +size 33554672 diff --git a/checkpoints/comma/model/decoder/23/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/23/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4a2f3a90817dc88ac6273e6412212dca2c8da3a8 --- /dev/null +++ b/checkpoints/comma/model/decoder/23/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e675f8f67676d1300459be6894bc1e3e3c8b9eba6698c0d441c35fdf9716b952 +size 67109160 diff --git a/checkpoints/comma/model/decoder/23/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/23/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..955dc7f3d40e80bb7facf66cb59852a396bf54fb --- /dev/null +++ b/checkpoints/comma/model/decoder/23/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10e8ada344b40aa7e4680df7a808097a65097577771edb8ed1cc3a382060c7bb +size 4192 diff --git a/checkpoints/comma/model/decoder/3/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/3/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b6664c1430980cd4c30706a8bcd60f354460d41d --- /dev/null +++ b/checkpoints/comma/model/decoder/3/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65655f53e106db075a666c85a6fc4fb2d959f37ebae1991d044d52111a8e1895 +size 8388848 diff --git a/checkpoints/comma/model/decoder/3/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/3/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..633466803f324a16e8ba3329343e5c41e52e8cff --- /dev/null +++ b/checkpoints/comma/model/decoder/3/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21f48fbb8ec4d216692fb2e52f8943cf5be686876a1ee13a0b7b762f0ca2ce90 +size 25166176 diff --git a/checkpoints/comma/model/decoder/3/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/3/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1da397826c017de2866331bf58dbd063d05189f2 --- /dev/null +++ b/checkpoints/comma/model/decoder/3/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f15e3572a092e5cd21e26e932e01a0b14dbebe51e094c234b91c0cb5d4a1e387 +size 4192 diff --git a/checkpoints/comma/model/decoder/3/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/3/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9b6ef59d54149e80f62dd934ef5563bd34b38b8f --- /dev/null +++ b/checkpoints/comma/model/decoder/3/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44eee4315c7bd35b4c28441cad516fdb1d20f192fec8581450f64d5a2f45169f +size 33554672 diff --git a/checkpoints/comma/model/decoder/3/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/3/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8b36ac9b2dc23a83ee9120101919696a24664aee --- /dev/null +++ b/checkpoints/comma/model/decoder/3/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5df71ec906c9b8ba2fb8aecbd70b75e99bfd09b74b992f7cd32aff498357ed14 +size 67109160 diff --git a/checkpoints/comma/model/decoder/3/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/3/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..14d4a412a752d10488059c9b0097321185360ed5 --- /dev/null +++ b/checkpoints/comma/model/decoder/3/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1472541f5f0a7279c9206c21b6aaf43a25f5439cc9598c8257a6c7874991002 +size 4192 diff --git a/checkpoints/comma/model/decoder/4/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/4/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..69035b0590af1ec1804bd82685e956d7d513e3ac --- /dev/null +++ b/checkpoints/comma/model/decoder/4/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02b389d170ef9b1b749b72c231af9162b37da034c72f44b512da626965e742e7 +size 8388848 diff --git a/checkpoints/comma/model/decoder/4/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/4/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..902d55cf7407c551cd4b238460e330655e542eeb --- /dev/null +++ b/checkpoints/comma/model/decoder/4/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eb4771ab8e040235dfec4e7bbd4e5269e07d41f04eab27a3fd7a2d152623852 +size 25166176 diff --git a/checkpoints/comma/model/decoder/4/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/4/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ed9e33b77d0a73c603d932fc20f35cd68c28b595 --- /dev/null +++ b/checkpoints/comma/model/decoder/4/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86982c0ff58883dbd4d337411d7d9b003112bba3c8ae8f95222e9ae57dc7ca2e +size 4192 diff --git a/checkpoints/comma/model/decoder/4/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/4/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c959d855baf3730ebd124b9135301b90f4596ad8 --- /dev/null +++ b/checkpoints/comma/model/decoder/4/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12b57ddb18b0eb1f1cb2dc7b610ef8f63c9bcf20b0c662049a762cff1903a136 +size 33554672 diff --git a/checkpoints/comma/model/decoder/4/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/4/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b83613642068ab91063807854bbdb9fb048544dd --- /dev/null +++ b/checkpoints/comma/model/decoder/4/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47a646c66eb12b96754c9539e9176906ce4569c1c77b4738bb0a64c0fa77cad6 +size 67109160 diff --git a/checkpoints/comma/model/decoder/4/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/4/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e2619a5a87d02879f1e21cba8a8e25c6a86f8796 --- /dev/null +++ b/checkpoints/comma/model/decoder/4/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cb9788f192937accb1417588d66061e505f53060f7c09d300d0d03ac4c708cd +size 4192 diff --git a/checkpoints/comma/model/decoder/5/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/5/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f440f76bf3a7b4b335d1717a04daf7ba0c43ccac --- /dev/null +++ b/checkpoints/comma/model/decoder/5/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:122df0b700b8aebc79658d1f359e0912829ca5ba55066f1340ff38ec8998759c +size 8388848 diff --git a/checkpoints/comma/model/decoder/5/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/5/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ade3573f7f06fe984a6475e6b113fc5e20cc05b4 --- /dev/null +++ b/checkpoints/comma/model/decoder/5/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7fb985ebaa7d7352cb810c833146089eb79e46d948d160ca8217c044b6934df +size 25166176 diff --git a/checkpoints/comma/model/decoder/5/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/5/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ff223bc3f27febcee16a73f49ea6f929b5f0946d --- /dev/null +++ b/checkpoints/comma/model/decoder/5/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50667cbc91d42e0518c3dcc2556f46d62ecfe203bf91accdda8aeb67d15a6d4d +size 4192 diff --git a/checkpoints/comma/model/decoder/5/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/5/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..216c660858c2e23bb6868fba463352752d2e7452 --- /dev/null +++ b/checkpoints/comma/model/decoder/5/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d53bc6d1637688881e9245f872917a55009b9c1a6b57b0f643f7c1545fb51621 +size 33554672 diff --git a/checkpoints/comma/model/decoder/5/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/5/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..37a53c54e0957e11aa24677854b85c1879c57a80 --- /dev/null +++ b/checkpoints/comma/model/decoder/5/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d97cd40088b707e1d79f53fac589c5fcc7e09dd50352a3e1ba3eff0dfe66d8b +size 67109160 diff --git a/checkpoints/comma/model/decoder/5/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/5/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a55450e9cb0ba27132b827228b1ca9deec2be09e --- /dev/null +++ b/checkpoints/comma/model/decoder/5/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2121d96f3cc039a24293f45d09f914dbef58d50b3d4ad3e459662b59b234855c +size 4192 diff --git a/checkpoints/comma/model/decoder/6/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/6/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2c082eebdeacd529039018bc34fd7d2600688a2a --- /dev/null +++ b/checkpoints/comma/model/decoder/6/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5286ccf5f1ebe57abeebd3f3580262dbc959346a1a4e5a0a5eeedfc79f13d6e6 +size 8388848 diff --git a/checkpoints/comma/model/decoder/6/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/6/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b24d80cb8a7c54b2746b3893b75d1a39c4524cfe --- /dev/null +++ b/checkpoints/comma/model/decoder/6/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfbf6c223dec7f8aba624d3c26161bb4d2cdff499cb43eceb8803e28ec344854 +size 25166176 diff --git a/checkpoints/comma/model/decoder/6/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/6/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..13a33e565d98821d1c2fa1d1b7c6c1ec1ec9394b --- /dev/null +++ b/checkpoints/comma/model/decoder/6/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72af0a961d4f2feeb66ba0386dde83c1f2dc5713ff36bfd0bbdaf56c1ee6397d +size 4192 diff --git a/checkpoints/comma/model/decoder/6/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/6/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5ea127183f707cac7d029ef372b6b9938121be49 --- /dev/null +++ b/checkpoints/comma/model/decoder/6/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61423980dc5b4b58fe57a45d6dd16891f8b749fc776566a1f342f3212061b581 +size 33554672 diff --git a/checkpoints/comma/model/decoder/6/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/6/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6e9660c2e77b741abd5c06b7f90f5d62430077bf --- /dev/null +++ b/checkpoints/comma/model/decoder/6/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:987e86d70f7e3858e02e870bda5bfb1f02ff1d692516e8671b09f054baf12fad +size 67109160 diff --git a/checkpoints/comma/model/decoder/6/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/6/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0e48f73c7d3f8faffe98307a4e090139bb8902c5 --- /dev/null +++ b/checkpoints/comma/model/decoder/6/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbff6dcfea92356bfec7101001fdb402ddade093bb2115df210fa4a610969455 +size 4192 diff --git a/checkpoints/comma/model/decoder/7/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/7/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4311aa635d02103e50ccbb6f0f8987871912d94b --- /dev/null +++ b/checkpoints/comma/model/decoder/7/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1532c1c8c94a5dbb6ae7cb51b9d9aecfb106728490b725ef1969d6f6a8026f20 +size 8388848 diff --git a/checkpoints/comma/model/decoder/7/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/7/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9e53b4974347e05e327cb8e433f2227d8f3bd67b --- /dev/null +++ b/checkpoints/comma/model/decoder/7/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eee4b193683e187a04dace541bf108a9fe076865e8565ed078c047363f880d1f +size 25166176 diff --git a/checkpoints/comma/model/decoder/7/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/7/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..aff773cc544b017bd65d4d477c7b5d355d674658 --- /dev/null +++ b/checkpoints/comma/model/decoder/7/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb501141e16f873e49bcd7a87c67b56ae97ab94de65138ec055067d5d1c2f1a1 +size 4192 diff --git a/checkpoints/comma/model/decoder/7/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/7/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..db9b188dcc09b8ca26ba5568de8c10c25674943f --- /dev/null +++ b/checkpoints/comma/model/decoder/7/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b6b50abeb7174a89c0f76cade558759008ac74c04a9b7a0c3481318afc47838 +size 33554672 diff --git a/checkpoints/comma/model/decoder/7/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/7/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d3a9e7cd2e913c2969bda8ed2a2c5d3753fec10c --- /dev/null +++ b/checkpoints/comma/model/decoder/7/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c88d8fbcef5827237cca0ac76f14ac36b212b5ea5422990ca3c75eeb08a442c7 +size 67109160 diff --git a/checkpoints/comma/model/decoder/7/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/7/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..203492cee4103b0c3bcf3677637be67fedea710f --- /dev/null +++ b/checkpoints/comma/model/decoder/7/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:264fccf57f03e64161733ea9fc23cd982593d9dbd501a3ebb8abf5cb9fc53af0 +size 4192 diff --git a/checkpoints/comma/model/decoder/8/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/8/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..72a9d3253d82d179015362580b2b931a4e61e65a --- /dev/null +++ b/checkpoints/comma/model/decoder/8/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5faf9813b6519e909d216392e3a79b124739a119025b33337dbba1d4f594774 +size 8388848 diff --git a/checkpoints/comma/model/decoder/8/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/8/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e2c7518f54e7f5bf2fa101bc4d3a28423a5e0c57 --- /dev/null +++ b/checkpoints/comma/model/decoder/8/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e217fbaabbcb6d5de9b4d26c9dc2bf357bfa601508e08ba949e93020749766b3 +size 25166176 diff --git a/checkpoints/comma/model/decoder/8/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/8/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..69cd87cb8ffc404e5f0f9a8eb189e44b3bada991 --- /dev/null +++ b/checkpoints/comma/model/decoder/8/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9a2b5b00886b53f3a76e55dfbc6b007cb0e15506634fa0c76dde504910ed866 +size 4192 diff --git a/checkpoints/comma/model/decoder/8/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/8/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..27430141e26c6dbf6cd7ed69ec64d6d0a50727d6 --- /dev/null +++ b/checkpoints/comma/model/decoder/8/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b42c82717968da370da6fe1204bcb27361354350fd560f3d7db4e1555b441d44 +size 33554672 diff --git a/checkpoints/comma/model/decoder/8/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/8/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b70fc8e7ef3de846066cbd35407d2a6b13a00ec2 --- /dev/null +++ b/checkpoints/comma/model/decoder/8/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31e20f76ed964dcb673e407a8903ac675deaf15525ed4298826e74648229cef0 +size 67109160 diff --git a/checkpoints/comma/model/decoder/8/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/8/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..77b8125060cdd925a2459116161215b372382a5a --- /dev/null +++ b/checkpoints/comma/model/decoder/8/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15169a215ea8a231087b8056e8fcdfc2587934a5905d894032e1e3b0832a9a0e +size 4192 diff --git a/checkpoints/comma/model/decoder/9/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/9/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d61202e5f113a5d4fa6b96aed0d07dfa42622ac1 --- /dev/null +++ b/checkpoints/comma/model/decoder/9/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:224f4cc170aff008571830dbeb2e37940be429ac8d9db491aa7caac5bec9b024 +size 8388848 diff --git a/checkpoints/comma/model/decoder/9/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/9/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..00dabff0401cef490fe0d13b9c941e9fbfa86c94 --- /dev/null +++ b/checkpoints/comma/model/decoder/9/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f3494ce7363b597e4182783a90da3da58372fdf5cdea1a976c34d85b73ca193 +size 25166176 diff --git a/checkpoints/comma/model/decoder/9/pp_block/input_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/9/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d6258ec6ef0109abf1ca1a052a2b939025e558fe --- /dev/null +++ b/checkpoints/comma/model/decoder/9/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f83b6a9c906c5bad67e043dbeec46c66f0bde204c903a5835d14c82f4e23745d +size 4192 diff --git a/checkpoints/comma/model/decoder/9/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/9/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7a4d9586d338feb3edcf1c32aea6d811b11a04ab --- /dev/null +++ b/checkpoints/comma/model/decoder/9/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9d28b996a05bfb0cd23c38f87221a3686da6a7b90bcd200c1829eaebb774c6a +size 33554672 diff --git a/checkpoints/comma/model/decoder/9/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/decoder/9/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8a8b74717bbe0dd7f0e7aeec1f60226bd8dfd352 --- /dev/null +++ b/checkpoints/comma/model/decoder/9/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d78073d08cf664394a5df854242d47e69f40f1c38d2fb50b5be03d48796f3a89 +size 67109160 diff --git a/checkpoints/comma/model/decoder/9/pp_block/post_attention_layernorm/model_weight.safetensors b/checkpoints/comma/model/decoder/9/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..460ab5b573ab085b6c54f57917184dd52681f6b5 --- /dev/null +++ b/checkpoints/comma/model/decoder/9/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92e8d7157515ff8d849622b613c49c52379342325171d5eb12149c0abd5804cd +size 4192 diff --git a/checkpoints/comma/model/final_layer_norm/pp_block/model_weight.safetensors b/checkpoints/comma/model/final_layer_norm/pp_block/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7f3185e37b5d8a7ae9db4db50f5bf0e9e24019e7 --- /dev/null +++ b/checkpoints/comma/model/final_layer_norm/pp_block/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49b77184f92a4c3beced2d74cf503cd177f84825df1d3484c16bf47b9abcfca8 +size 4192 diff --git a/checkpoints/comma/model/token_position_embeddings/pp_block/token_embedding/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors b/checkpoints/comma/model/token_position_embeddings/pp_block/token_embedding/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1f21efac57ff86e6dfa4f5033300d07bb59b2b7d --- /dev/null +++ b/checkpoints/comma/model/token_position_embeddings/pp_block/token_embedding/model_weight_pp-rank-0-of-1_tp-rank-0-of-1.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6eb99b845b59631e2b9ef5865d79b3a6f5e219ad096109f4943b7e279afe433 +size 205914352