diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..a5ed551576953bbaaa85d9a12e4fdcbdbdb84463 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,792 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +model/model/embed_tokens/embedding/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/embed_tokens/embedding/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/embed_tokens/embedding/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/embed_tokens/embedding/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/k_proj/kernel/3.0 filter=lfs 
diff=lfs merge=lfs -text +model/model/layers/0/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/1/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/10/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/11/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/11/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/12/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/13/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/14/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/15/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/15/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/16/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/16/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/17/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/17/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/18/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/18/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/19/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/19/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/2/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/v_proj/kernel/1.0 
filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/20/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/20/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/21/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/21/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/22/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/22/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/23/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/23/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/24/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/24/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/24/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/25/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/25/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/26/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/26/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/27/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/27/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/3/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/v_proj/kernel/3.0 
filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/4/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/o_proj/kernel/0.2 filter=lfs 
diff=lfs merge=lfs -text +model/model/layers/5/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/6/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/up_proj/kernel/1.0 
filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/8/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/down_proj/kernel/0.0 
filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/9/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000000000000000000000000000000000000..abb168643ca8e7e49ef30c94dec29381ab557a9e --- /dev/null +++ b/README.md @@ -0,0 +1,159 @@ +--- +library_name: easydel +pipeline_tag: text-generation +tags: + - easydel + - jax + - "llama" + - "CausalLM" + - "vanilla" +--- + +

+ easydel +

+ +

meta-llama/Llama-3.2-3B-Instruct

+ +
+ EasyDeL checkpoint converted from meta-llama/Llama-3.2-3B-Instruct. +
+ +## Overview + +This checkpoint is intended to be loaded with EasyDeL on JAX (CPU/GPU/TPU). It supports sharded loading with `auto_shard_model=True` and configurable precision via `dtype`, `param_dtype`, and `precision`. + +## Quickstart + +```python +import easydel as ed +from jax import numpy as jnp, lax + +repo_id = "EasyDeL/Llama-3.2-3B-Instruct" + +dtype = jnp.bfloat16 # try jnp.float16 on many GPUs + +model = ed.AutoEasyDeLModelForCausalLM.from_pretrained( + repo_id, + dtype=dtype, + param_dtype=dtype, + precision=lax.Precision("fastest"), + sharding_axis_names=("dp", "fsdp", "ep", "tp", "sp"), + sharding_axis_dims=(1, -1, 1, 1, 1), + config_kwargs=ed.EasyDeLBaseConfigDict( + attn_dtype=dtype, + attn_mechanism=ed.AttentionMechanisms.VANILLA, + fsdp_is_ep_bound=True, + sp_is_ep_bound=True, + moe_method=ed.MoEMethods.FUSED_MOE, + ), + auto_shard_model=True, + partition_axis=ed.PartitionAxis(), +) +``` + +If the repository only provides PyTorch weights, pass `from_torch=True` to `from_pretrained(...)`. + +## Sharding & Parallelism (Multi-Device) + +EasyDeL can scale to multiple devices by creating a logical device mesh. Most EasyDeL loaders use a 5D mesh: + +- `dp`: data parallel (replicated parameters, different batch shards) +- `fsdp`: parameter sharding (memory saver; often the biggest axis) +- `ep`: expert parallel (MoE; keep `1` for non-MoE models) +- `tp`: tensor parallel (splits large matmuls) +- `sp`: sequence parallel (splits sequence dimension) + +Use `sharding_axis_names=("dp","fsdp","ep","tp","sp")` and choose `sharding_axis_dims` so that their product equals your device count. +You can use `-1` in `sharding_axis_dims` to let EasyDeL infer the remaining dimension. + +
+Example sharding configs + +```python +# 8 devices, pure FSDP +sharding_axis_dims = (1, 8, 1, 1, 1) + +# 8 devices, 2-way DP x 4-way FSDP +sharding_axis_dims = (2, 4, 1, 1, 1) + +# 8 devices, 4-way FSDP x 2-way TP +sharding_axis_dims = (1, 4, 1, 2, 1) +``` +
+ +## Using via `eLargeModel` (ELM) + +`eLargeModel` is a higher-level interface that wires together loading, sharding, training, and eSurge inference from a single config. + +```python +from easydel import eLargeModel + +repo_id = "EasyDeL/Llama-3.2-3B-Instruct" + +elm = eLargeModel.from_pretrained(repo_id) # task is auto-detected +elm.set_dtype("bf16") +elm.set_sharding(axis_names=("dp", "fsdp", "ep", "tp", "sp"), axis_dims=(1, -1, 1, 1, 1)) + +model = elm.build_model() +# Optional: build an inference engine +# engine = elm.build_esurge() +``` + +
+ELM YAML config example + +```yaml +model: + name_or_path: "EasyDeL/Llama-3.2-3B-Instruct" + +loader: + dtype: bf16 + param_dtype: bf16 + +sharding: + axis_dims: [1, -1, 1, 1, 1] + auto_shard_model: true +``` +
+ +## Features + +**EasyDeL:** +- JAX native implementation and sharded execution +- Configurable attention backends via `AttentionMechanisms.*` +- Precision control via `dtype`, `param_dtype`, and `precision` + +## Installation + +```bash +pip install easydel +``` + +## Links + +- EasyDeL GitHub: https://github.com/erfanzar/EasyDeL +- Docs: https://easydel.readthedocs.io/en/latest/ + +## Supported Tasks + +- CausalLM + +## Limitations + +- Refer to the original model card for training data, evaluation, and intended use. + +## License + +EasyDeL is released under the Apache-2.0 license. The license for this model's weights may differ; please consult the original repository. + +## Citation + +```bibtex +@misc{ZareChavoshi_2023, + title={EasyDeL: An open-source library for enhancing and streamlining the training process of machine learning models}, + url={https://github.com/erfanzar/EasyDeL}, + author={Zare Chavoshi, Erfan}, + year={2023} +} +``` diff --git a/chat_template.jinja b/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..1bad6a0f648dccdbec523ca79ba90fbcfc806af0 --- /dev/null +++ b/chat_template.jinja @@ -0,0 +1,93 @@ +{{- bos_token }} +{%- if custom_tools is defined %} + {%- set tools = custom_tools %} +{%- endif %} +{%- if not tools_in_user_message is defined %} + {%- set tools_in_user_message = true %} +{%- endif %} +{%- if not date_string is defined %} + {%- if strftime_now is defined %} + {%- set date_string = strftime_now("%d %b %Y") %} + {%- else %} + {%- set date_string = "26 Jul 2024" %} + {%- endif %} +{%- endif %} +{%- if not tools is defined %} + {%- set tools = none %} +{%- endif %} + +{#- This block extracts the system message, so we can slot it into the right place. 
#} +{%- if messages[0]['role'] == 'system' %} + {%- set system_message = messages[0]['content']|trim %} + {%- set messages = messages[1:] %} +{%- else %} + {%- set system_message = "" %} +{%- endif %} + +{#- System message #} +{{- "<|start_header_id|>system<|end_header_id|>\n\n" }} +{%- if tools is not none %} + {{- "Environment: ipython\n" }} +{%- endif %} +{{- "Cutting Knowledge Date: December 2023\n" }} +{{- "Today Date: " + date_string + "\n\n" }} +{%- if tools is not none and not tools_in_user_message %} + {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }} + {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }} + {{- "Do not use variables.\n\n" }} + {%- for t in tools %} + {{- t | tojson(indent=4) }} + {{- "\n\n" }} + {%- endfor %} +{%- endif %} +{{- system_message }} +{{- "<|eot_id|>" }} + +{#- Custom tools are passed in a user message with some extra guidance #} +{%- if tools_in_user_message and not tools is none %} + {#- Extract the first user message so we can plug it in here #} + {%- if messages | length != 0 %} + {%- set first_user_message = messages[0]['content']|trim %} + {%- set messages = messages[1:] %} + {%- else %} + {{- raise_exception("Cannot put tools in the first user message when there's no first user message!") }} +{%- endif %} + {{- '<|start_header_id|>user<|end_header_id|>\n\n' -}} + {{- "Given the following functions, please respond with a JSON for a function call " }} + {{- "with its proper arguments that best answers the given prompt.\n\n" }} + {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' 
}} + {{- "Do not use variables.\n\n" }} + {%- for t in tools %} + {{- t | tojson(indent=4) }} + {{- "\n\n" }} + {%- endfor %} + {{- first_user_message + "<|eot_id|>"}} +{%- endif %} + +{%- for message in messages %} + {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %} + {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' }} + {%- elif 'tool_calls' in message %} + {%- if not message.tool_calls|length == 1 %} + {{- raise_exception("This model only supports single tool-calls at once!") }} + {%- endif %} + {%- set tool_call = message.tool_calls[0].function %} + {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}} + {{- '{"name": "' + tool_call.name + '", ' }} + {{- '"parameters": ' }} + {{- tool_call.arguments | tojson }} + {{- "}" }} + {{- "<|eot_id|>" }} + {%- elif message.role == "tool" or message.role == "ipython" %} + {{- "<|start_header_id|>ipython<|end_header_id|>\n\n" }} + {%- if message.content is mapping or message.content is iterable %} + {{- message.content | tojson }} + {%- else %} + {{- message.content }} + {%- endif %} + {{- "<|eot_id|>" }} + {%- endif %} +{%- endfor %} +{%- if add_generation_prompt %} + {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }} +{%- endif %} diff --git a/checkpoint_metadata.json b/checkpoint_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..4c81abf3c5c309666a9c294a96147c020ac6a624 --- /dev/null +++ b/checkpoint_metadata.json @@ -0,0 +1,6 @@ +{ + "timestamp": "2025-12-28T22:37:13.086794", + "custom_metadata": { + "step": 0 + } +} \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6d65fe3dae6c1674d5c2702181ec300504652e10 --- /dev/null +++ b/config.json @@ -0,0 +1,163 @@ +{ + "_external_rope_config_kwargs": {}, + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + 
"attention_dropout": 0.0, + "attn_mechanism": "vanilla", + "backend": null, + "bits": null, + "blocksize_b": 1, + "blocksize_k": 128, + "blocksize_q": 128, + "bos_token_id": 128000, + "decode_attn_mechanism": null, + "dtype": "bfloat16", + "easy_method": "train", + "embd_pdrop": 0.0, + "eos_token_id": [ + 128001, + 128008, + 128009 + ], + "fcm_max_ratio": -1, + "fcm_min_ratio": -1, + "flash_attention_backward_pass_impl": "triton", + "fsdp_is_ep_bound": true, + "gradient_checkpointing": "", + "gradient_checkpointing_targets": null, + "hardware_abstraction": false, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 3072, + "initializer_range": 0.02, + "intermediate_size": 8192, + "kv_cache_quantization_config": null, + "kv_cache_sharding_sequence_axis_name": "sp", + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "moe_force_xla_gmm": false, + "moe_method": "fused_moe", + "moe_tiling_size_batch": 4, + "moe_tiling_size_dim": 128, + "moe_tiling_size_seqlen": 128, + "num_attention_heads": 24, + "num_hidden_layers": 28, + "num_key_value_heads": 8, + "number_rep_kv": 1, + "operation_configs": null, + "pallas_k_block_size": 128, + "pallas_m_block_size": 128, + "pallas_n_block_size": 128, + "partition_axis": { + "attention_dim_axis": null, + "attention_kv_dim_axis": null, + "batch_axis": [ + "fsdp", + "dp" + ], + "bias_head_sequence_axis": null, + 
"bias_key_sequence_axis": null, + "data_parallel_axis": "dp", + "decode_attention_dim_axis": null, + "decode_attention_kv_dim_axis": null, + "decode_batch_axis": [ + "fsdp", + "dp" + ], + "decode_head_axis": "tp", + "decode_key_sequence_axis": "sp", + "decode_kv_head_axis": "tp", + "decode_query_sequence_axis": null, + "expert_axis": "ep", + "expert_gate_axis": null, + "expert_parallel_axis": "ep", + "fully_sharded_data_parallel_axis": "fsdp", + "head_axis": "tp", + "hidden_state_axis": "tp", + "key_sequence_axis": "sp", + "kv_head_axis": "tp", + "mlp_intermediate_axis": "tp", + "query_sequence_axis": "sp", + "sequence_axis": "sp", + "sequence_parallel_axis": "sp", + "tensor_parallel_axis": "tp", + "vocab_axis": "tp" + }, + "platform": null, + "precompute_masks": true, + "pretraining_tp": 1, + "quantization_config": null, + "resid_pdrop": 0.0, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "scan_attention_layers": false, + "scan_layers": false, + "scan_mlp_chunk_size": 1024, + "scan_ring_attention": true, + "sequence_axis_name": "sp", + "sharding_axis_dims": [ + 1, + -1, + 1, + 1, + 1 + ], + "sharding_axis_names": [ + "dp", + "fsdp", + "ep", + "tp", + "sp" + ], + "sharding_dcn_axis_dims": null, + "sp_is_ep_bound": true, + "tie_word_embeddings": true, + "transformers_version": "4.57.3", + "use_cache": true, + "use_expert_tensor_mode": false, + "use_ring_of_experts": false, + "use_scan_mlp": false, + "use_sharded_kv_caching": false, + "use_sharding_constraint": false, + "vocab_size": 128256 +} diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..053ba37d35fa3f4c31eda32128d100783a4d1fa6 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,13 @@ +{ + "bos_token_id": 128000, + "do_sample": true, + "eos_token_id": [ + 128001, + 
128008, + 128009 + ], + "temperature": 0.6, + "top_p": 0.9, + "transformers_version": "4.57.3", + "trust_remote_code": false +} diff --git a/model/model/embed_tokens/embedding/.zarray b/model/model/embed_tokens/embedding/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..5ac17d100cbf35b5e3b4464fbbcd4d8c08fab06b --- /dev/null +++ b/model/model/embed_tokens/embedding/.zarray @@ -0,0 +1 @@ +{"chunks":[32064,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[128256,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/embed_tokens/embedding/0.0 b/model/model/embed_tokens/embedding/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e5224df982b76e7032f68aa30c1b8ce2eddb8a03 --- /dev/null +++ b/model/model/embed_tokens/embedding/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e8db8bd20deeaec8b980c8ae37aa6cd5c5d0fa70830e623d8477e8dfa9a78e3 +size 153553211 diff --git a/model/model/embed_tokens/embedding/1.0 b/model/model/embed_tokens/embedding/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..8dca47fee64199c286784a496e3e5e637ca18654 --- /dev/null +++ b/model/model/embed_tokens/embedding/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:897aeb79d84bd752a1529bf81b3d29478e34d3e9ebf6a8cd7b2fe0f0e497baee +size 153582249 diff --git a/model/model/embed_tokens/embedding/2.0 b/model/model/embed_tokens/embedding/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..5eeed93f690508dd79fff1c29bf43b5c82259100 --- /dev/null +++ b/model/model/embed_tokens/embedding/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3743db21822a6eca2489bc2f56f737b98ec935b01da4ec03944bd5d306197ba3 +size 153605814 diff --git a/model/model/embed_tokens/embedding/3.0 b/model/model/embed_tokens/embedding/3.0 new file mode 100644 index 
0000000000000000000000000000000000000000..6adf1c292bf86bba0695b1d828fe38c1101c52b2 --- /dev/null +++ b/model/model/embed_tokens/embedding/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:681f7aed511ada5f0e5e68d9e56b807d951a8f0b4befe7d121d5ba030224a5c5 +size 152474395 diff --git a/model/model/layers/0/input_layernorm/kernel/.zarray b/model/model/layers/0/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/0/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/0/input_layernorm/kernel/0 b/model/model/layers/0/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..68f128bd244ee81c0d43db270619c79345931426 Binary files /dev/null and b/model/model/layers/0/input_layernorm/kernel/0 differ diff --git a/model/model/layers/0/mlp/down_proj/kernel/.zarray b/model/model/layers/0/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/0/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/0/mlp/down_proj/kernel/0.0 b/model/model/layers/0/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f05289736265aae961d2a86775f1b743942cc5fd --- /dev/null +++ b/model/model/layers/0/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:a47b9bfb0ee6e7c654c9c2a9f2f8649d55600974f6cc2591b427de75905bc8c9 +size 9793994 diff --git a/model/model/layers/0/mlp/down_proj/kernel/0.1 b/model/model/layers/0/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..04ea84e2b29b36f355b7d53830698596cab4c3d8 --- /dev/null +++ b/model/model/layers/0/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ae3f28c244b23e04cc59266d9f9fe296eadfe4f1d65e74f63507003f3896a12 +size 9794191 diff --git a/model/model/layers/0/mlp/down_proj/kernel/0.2 b/model/model/layers/0/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..1d17762c898c8218f694d1de1ea95292eb7f77ab --- /dev/null +++ b/model/model/layers/0/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67859b4d82182869afd5ca4a83d449768515c6a5c664a73c098f2f5eb66228f7 +size 9790983 diff --git a/model/model/layers/0/mlp/down_proj/kernel/0.3 b/model/model/layers/0/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..63a03e2b8b7e2be761ba9d6010b00a80b7e3ec45 --- /dev/null +++ b/model/model/layers/0/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceea5feef5424d5c1767dd262f0dc476fb8ab12a22fb7348cc4dac16406a83c6 +size 9792322 diff --git a/model/model/layers/0/mlp/gate_proj/kernel/.zarray b/model/model/layers/0/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/0/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/0/mlp/gate_proj/kernel/0.0 
b/model/model/layers/0/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f4df616b0c6acc31c798e5fed71ba05a27e781fc --- /dev/null +++ b/model/model/layers/0/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbe037f40aed0c1446c92d1315d2e322894465257254ac62b80141d6623bb055 +size 9796524 diff --git a/model/model/layers/0/mlp/gate_proj/kernel/1.0 b/model/model/layers/0/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..af65168427b3fab084a6fadb9afe47bf60fb9d3c --- /dev/null +++ b/model/model/layers/0/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d36f4357f2b8d23a49d2c7d1fc6e25cfd5eadf5ffbea52e3a103ada3bab090ba +size 9795376 diff --git a/model/model/layers/0/mlp/gate_proj/kernel/2.0 b/model/model/layers/0/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..ee9dc263139f01ea9074506ab69e3491785b574d --- /dev/null +++ b/model/model/layers/0/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41794e257f366a9e39627ffda32d8db572e729c46777ffc8e8c566d8f820b4ac +size 9797415 diff --git a/model/model/layers/0/mlp/gate_proj/kernel/3.0 b/model/model/layers/0/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6494e30412dcb02933a87f90c1e2e549a0a3f162 --- /dev/null +++ b/model/model/layers/0/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f64adc7dc68277ee99a72e49e4b862e9d7244aa709bb56bd193623e22738d6be +size 9796042 diff --git a/model/model/layers/0/mlp/up_proj/kernel/.zarray b/model/model/layers/0/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/0/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/0/mlp/up_proj/kernel/0.0 b/model/model/layers/0/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a09165c105fc0d5fbedb3a2f7cb62ef5db843a19 --- /dev/null +++ b/model/model/layers/0/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0746c3241577837ad26bb8ebd2326da9e38c0366c310cd1aa36c644940f1f8e6 +size 9792876 diff --git a/model/model/layers/0/mlp/up_proj/kernel/1.0 b/model/model/layers/0/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..be1cc06fbb53a296f796ad5cf952bdb091fbf726 --- /dev/null +++ b/model/model/layers/0/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eb7e6ca1c55e609a0cad20db51a8ee0e8c271fa9d6663f480396bd0a7ab6688 +size 9791805 diff --git a/model/model/layers/0/mlp/up_proj/kernel/2.0 b/model/model/layers/0/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..aee5da17180d26fb3359f4444df176866607fc73 --- /dev/null +++ b/model/model/layers/0/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd0995800479b3f2626cabfa156300a63f86a53e371d728e753c22a7ef2d77d1 +size 9794440 diff --git a/model/model/layers/0/mlp/up_proj/kernel/3.0 b/model/model/layers/0/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..2670d67aee7ea872c10978fabd2c6c983184d653 --- /dev/null +++ b/model/model/layers/0/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbe64d39a64d1a6d94855294f455bb76bbc7e6f24d953a9ff18a67d4486284cf +size 9793131 diff --git a/model/model/layers/0/post_attention_layernorm/kernel/.zarray 
b/model/model/layers/0/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/0/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/0/post_attention_layernorm/kernel/0 b/model/model/layers/0/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..917499717ff405f853c30932eda86a7e8007bc1b Binary files /dev/null and b/model/model/layers/0/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/0/self_attn/k_proj/kernel/.zarray b/model/model/layers/0/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/0/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/0/self_attn/k_proj/kernel/0.0 b/model/model/layers/0/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..71bd8463b86915d393fcc33b455b4f69fa4adef0 --- /dev/null +++ b/model/model/layers/0/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:579517a24755958c87b96f74c4c680c5333e07c17f55646a078a4cc752f2100e +size 1252588 diff --git a/model/model/layers/0/self_attn/k_proj/kernel/1.0 b/model/model/layers/0/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..03928d38ae790c45abb91fedeb3b0b59c8035bdc 
--- /dev/null +++ b/model/model/layers/0/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11b660a00120b2df24ab4992b7896c8024e60e2722764873809395581fb198d9 +size 1253220 diff --git a/model/model/layers/0/self_attn/k_proj/kernel/2.0 b/model/model/layers/0/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..13b55da19e18f49154728703a5430fdbc3ff6858 --- /dev/null +++ b/model/model/layers/0/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d135941603ce0b4f9986d30376fe2f50644ca5c617f28644dd6347e38e97cbb +size 1252977 diff --git a/model/model/layers/0/self_attn/k_proj/kernel/3.0 b/model/model/layers/0/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..cbb5e6f5525c744389cdf2b2919720fed2b89b8d --- /dev/null +++ b/model/model/layers/0/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebee806dc09c7d899f997b002259690751a2f99e1ffa333c94183ff93028fc54 +size 1250855 diff --git a/model/model/layers/0/self_attn/o_proj/kernel/.zarray b/model/model/layers/0/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/0/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/0/self_attn/o_proj/kernel/0.0 b/model/model/layers/0/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..75e53d82752406450173ab7a1312a9cc62310a95 --- /dev/null +++ b/model/model/layers/0/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:fd5bae5d43cecc11f61832bb902d9a0bcb4cf41cee21ac887e65be6c346b3a0d +size 3679776 diff --git a/model/model/layers/0/self_attn/o_proj/kernel/0.1 b/model/model/layers/0/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..f59581233368e295baca332ea23bd6ba16a67730 --- /dev/null +++ b/model/model/layers/0/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf31fec254143a5d3f8e1cd70a3cc8868c2c70706312c1c4c57f68e0994a7650 +size 3679991 diff --git a/model/model/layers/0/self_attn/o_proj/kernel/0.2 b/model/model/layers/0/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..9e5a2890eeb1741e5984309f8083e18998c06061 --- /dev/null +++ b/model/model/layers/0/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c1e37b7653fd2586a8b3f603f779cd24d536d1af1d3d30ac5633c7003a52c76 +size 3679503 diff --git a/model/model/layers/0/self_attn/o_proj/kernel/0.3 b/model/model/layers/0/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..3ee86d90605827acc07562bf288c2e29c9c0736d --- /dev/null +++ b/model/model/layers/0/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d72677052a0fab5a7f22a48befc6f5211f24cdfa420c5b2894dbc111838c2e01 +size 3680553 diff --git a/model/model/layers/0/self_attn/q_proj/kernel/.zarray b/model/model/layers/0/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/0/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/0/self_attn/q_proj/kernel/0.0 b/model/model/layers/0/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..d36dc82ad458311f5e2a34e1875dd5352bc578d5 --- /dev/null +++ b/model/model/layers/0/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25d0d6d2171812c7f8e7171649df21d1eee888b8fc6ece3ea531984860303e52 +size 3772558 diff --git a/model/model/layers/0/self_attn/q_proj/kernel/1.0 b/model/model/layers/0/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..db1c5af26f759f3fc1304d3dafe4bde55c9ce4c4 --- /dev/null +++ b/model/model/layers/0/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c81ddfb580266bb7b4893000b95b69e04062dc5789686363be1df84ab5213b5d +size 3774141 diff --git a/model/model/layers/0/self_attn/q_proj/kernel/2.0 b/model/model/layers/0/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..98fb1d4f461ce1fde15bb3531913526e8dad5545 --- /dev/null +++ b/model/model/layers/0/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d7b6d1c5632f78b9e5d1e973edd72aa6a9c898a312c9b96d71b03d4323e5d72 +size 3769330 diff --git a/model/model/layers/0/self_attn/q_proj/kernel/3.0 b/model/model/layers/0/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..fa01da8809353110d91c4ad253de63a898bf4fe3 --- /dev/null +++ b/model/model/layers/0/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:682cb995acecc7700339b9d665191b086e719e3f6b040ae072a2c78d258e956f +size 3762911 diff --git a/model/model/layers/0/self_attn/v_proj/kernel/.zarray b/model/model/layers/0/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- 
/dev/null +++ b/model/model/layers/0/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/0/self_attn/v_proj/kernel/0.0 b/model/model/layers/0/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ac02699e275fe253bf71d2c24ab7d6167b3ea50b --- /dev/null +++ b/model/model/layers/0/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0688e594d8cfb76c01ec5ef3bd86fa1316ce52017eb6f865abd503d16c5acb37 +size 1249107 diff --git a/model/model/layers/0/self_attn/v_proj/kernel/1.0 b/model/model/layers/0/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..ece691253b7892aab19e5f87e96e8d888fd8df85 --- /dev/null +++ b/model/model/layers/0/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d4eb7b216cfb5fa6ee1db83a58176c2f75cfd7649ad4ba11735e5592b00fc84 +size 1249709 diff --git a/model/model/layers/0/self_attn/v_proj/kernel/2.0 b/model/model/layers/0/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..09b9a7731e7e3cad51546feba4e1e802b89d9e71 --- /dev/null +++ b/model/model/layers/0/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a736c89e062ca686f4de6087bd5b68c49af1648552fac9bca8180783be38760 +size 1249755 diff --git a/model/model/layers/0/self_attn/v_proj/kernel/3.0 b/model/model/layers/0/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..42c15212f85282aff04fe60f9e2f0088f14d3fe6 --- /dev/null +++ b/model/model/layers/0/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:91e93401a827022d5dc37d7164b922a617cdd8e5859c9c240e649220fefbfb54 +size 1247987 diff --git a/model/model/layers/1/input_layernorm/kernel/.zarray b/model/model/layers/1/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/1/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/1/input_layernorm/kernel/0 b/model/model/layers/1/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..f82cff7a8806bebddea11c6aac19393b795bca80 Binary files /dev/null and b/model/model/layers/1/input_layernorm/kernel/0 differ diff --git a/model/model/layers/1/mlp/down_proj/kernel/.zarray b/model/model/layers/1/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/1/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/1/mlp/down_proj/kernel/0.0 b/model/model/layers/1/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..1fe54e0fc3ae187f8261e80fb5dd534c779343a7 --- /dev/null +++ b/model/model/layers/1/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51400b9d4f34efa82c944f85f94bcf173537dfadb0be663e73e112b85f157d76 +size 9791929 diff --git a/model/model/layers/1/mlp/down_proj/kernel/0.1 b/model/model/layers/1/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..fa8e873f5db8f074b78f911b34b26a2b61afed97 --- /dev/null +++ b/model/model/layers/1/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82b0a06379900cf60bc61d4dc9d2d73879397882bf794726d37e3ebaad3edb80 +size 9792708 diff --git a/model/model/layers/1/mlp/down_proj/kernel/0.2 b/model/model/layers/1/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..95c3f54951364c80a42debf81b626e7696720baf --- /dev/null +++ b/model/model/layers/1/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d294080274e59bb11a60d606a40d666699d78201dcd06d54305fdd44b026eb +size 9791918 diff --git a/model/model/layers/1/mlp/down_proj/kernel/0.3 b/model/model/layers/1/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..8e010f9c3c9e2664846cb0c9015dec5f49af2ad8 --- /dev/null +++ b/model/model/layers/1/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b2c56e70dee033a2cbeecf039cd57345105cec9b32285024f3e214a1667e14a +size 9792057 diff --git a/model/model/layers/1/mlp/gate_proj/kernel/.zarray b/model/model/layers/1/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/1/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/1/mlp/gate_proj/kernel/0.0 b/model/model/layers/1/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..825adf47f2e4d4636206042c5de4fe2f1391205c --- /dev/null +++ b/model/model/layers/1/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:dc28027115019af35675ed4d3dbb6a99785cb33745b3d0b0fa2d1e6bd020b8da +size 9803142 diff --git a/model/model/layers/1/mlp/gate_proj/kernel/1.0 b/model/model/layers/1/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..308f9dbcf9b8cac66152fbe503b079b7ac1cf294 --- /dev/null +++ b/model/model/layers/1/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17975d4bb00929a56e3d6cb3acc29e1a8212febe4b4190f6b198f5ed96e25132 +size 9805027 diff --git a/model/model/layers/1/mlp/gate_proj/kernel/2.0 b/model/model/layers/1/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..5e84f2eb92a51352fcd8fb425fd757139b4283bd --- /dev/null +++ b/model/model/layers/1/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3caad9f967d139b572582b3cb11fac655b93a1b1984148faa2d6b9673f1a7b5 +size 9801427 diff --git a/model/model/layers/1/mlp/gate_proj/kernel/3.0 b/model/model/layers/1/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..9b4ed8639fd015d9905984788a90659aa4747cbb --- /dev/null +++ b/model/model/layers/1/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f632b68b2abb786486a18c7af7d30334a52a671e02b2f0a56db12b4c607f33d8 +size 9801772 diff --git a/model/model/layers/1/mlp/up_proj/kernel/.zarray b/model/model/layers/1/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/1/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/1/mlp/up_proj/kernel/0.0 b/model/model/layers/1/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..3dab0bbea9a7beab0c8efa52c5438f8106a5a39e --- /dev/null +++ b/model/model/layers/1/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fc35e5512381f1348e5d926eb4a38ca4c4e77d418e9b81bd312446b01ef5967 +size 9796347 diff --git a/model/model/layers/1/mlp/up_proj/kernel/1.0 b/model/model/layers/1/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..9735874c272dbbf41ad7def68c109a4f32fd8acc --- /dev/null +++ b/model/model/layers/1/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc625a080fc57e99de105e0dfb9a0fb9ffd884335661996f50e73319ec970985 +size 9798402 diff --git a/model/model/layers/1/mlp/up_proj/kernel/2.0 b/model/model/layers/1/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..8d1ce816202bc514f4cdaed120b58fd35119ecbe --- /dev/null +++ b/model/model/layers/1/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f2d270eb00e562498942e8000adb7f696217062d008f92f0d2c58b6656e5206 +size 9795255 diff --git a/model/model/layers/1/mlp/up_proj/kernel/3.0 b/model/model/layers/1/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..5db3c9177aa52e04086f43126b10fbce5d6ae8a4 --- /dev/null +++ b/model/model/layers/1/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a42641264059d3ab49d22be9742949094c9244b78e8a293305c588cfc76cebe +size 9795943 diff --git a/model/model/layers/1/post_attention_layernorm/kernel/.zarray b/model/model/layers/1/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ 
b/model/model/layers/1/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/1/post_attention_layernorm/kernel/0 b/model/model/layers/1/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..b86fc7e395678bc7212c9e998314d094671328f6 Binary files /dev/null and b/model/model/layers/1/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/1/self_attn/k_proj/kernel/.zarray b/model/model/layers/1/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/1/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/1/self_attn/k_proj/kernel/0.0 b/model/model/layers/1/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e5438fbc3c45d4ce8439c0e1721a08c0b44e8bab --- /dev/null +++ b/model/model/layers/1/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3810e1c1830093a0cdd69884f5ac927c9b3e1e73b2ab45168873ad8a1a0ac0ff +size 1246164 diff --git a/model/model/layers/1/self_attn/k_proj/kernel/1.0 b/model/model/layers/1/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..d1f224aca73387dbb3e6abf7cfc879866bbff837 --- /dev/null +++ b/model/model/layers/1/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:5aa03deb6bc6511b4c4f26aae01ff0dd72bada0a772e4b4d5dd9205a3879683b +size 1246941 diff --git a/model/model/layers/1/self_attn/k_proj/kernel/2.0 b/model/model/layers/1/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..d122df15504e3da0ac552b3bbbff2fa1e3d51fda --- /dev/null +++ b/model/model/layers/1/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fd228b1a6df0127cc1d34fefa0d2aa8faa8be3109af93a9242fa3bb54a8a83c +size 1246078 diff --git a/model/model/layers/1/self_attn/k_proj/kernel/3.0 b/model/model/layers/1/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..1e9fd125606d05474c2faad11f7c823e2949d913 --- /dev/null +++ b/model/model/layers/1/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96eb75d839ce42894d4ea851d44faec2171f9097a748f56f14a2955a2c3c54a8 +size 1246133 diff --git a/model/model/layers/1/self_attn/o_proj/kernel/.zarray b/model/model/layers/1/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/1/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/1/self_attn/o_proj/kernel/0.0 b/model/model/layers/1/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..829a65b7856cd207ce2043f5ec4082768b9dadbb --- /dev/null +++ b/model/model/layers/1/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88a3f6194993c88f7805d0e598d08fb812a6467c431a9be022a333ee8424c6e3 +size 3673749 diff --git 
a/model/model/layers/1/self_attn/o_proj/kernel/0.1 b/model/model/layers/1/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..8272f059fac099357f8c1bd52f2d9b7092f1eca4 --- /dev/null +++ b/model/model/layers/1/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f502ac524dfb294ece6dd77116fc9cbeed611ba069f1a78bf752895d8ed98776 +size 3673980 diff --git a/model/model/layers/1/self_attn/o_proj/kernel/0.2 b/model/model/layers/1/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..8389ff641c6eded63d806ee9e2ca845698a1317b --- /dev/null +++ b/model/model/layers/1/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b79ab5372f0780124b4027811f9f4bf76f4921d7c9c0e932056176497d50baab +size 3673425 diff --git a/model/model/layers/1/self_attn/o_proj/kernel/0.3 b/model/model/layers/1/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..81d2c47beb5e74cdfad42d7e0b4b82154b4b9c86 --- /dev/null +++ b/model/model/layers/1/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90b20ba3165fd486dd8ba89b22195aad91526058f6b17eac7cb32c796d93e005 +size 3674198 diff --git a/model/model/layers/1/self_attn/q_proj/kernel/.zarray b/model/model/layers/1/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/1/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/1/self_attn/q_proj/kernel/0.0 b/model/model/layers/1/self_attn/q_proj/kernel/0.0 new file mode 100644 index 
0000000000000000000000000000000000000000..61abf2d3fd8e390b42bea67c30a13e12fd1d71d5 --- /dev/null +++ b/model/model/layers/1/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c842054174d8a7fb589bfa71a989127dcbedab0a5ab7967d45fbdf882e6af808 +size 3731738 diff --git a/model/model/layers/1/self_attn/q_proj/kernel/1.0 b/model/model/layers/1/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..ec1b561ebd585d7908b626543eec72b59d203adc --- /dev/null +++ b/model/model/layers/1/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f56fb0f8087f2e2f94c077bcf9f020159a32548d05e2c5eb52fc5654ed43abfc +size 3734483 diff --git a/model/model/layers/1/self_attn/q_proj/kernel/2.0 b/model/model/layers/1/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..a5651be7e85afca7cd16c55686695cbd3fb8a853 --- /dev/null +++ b/model/model/layers/1/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6564073c1752c0edcb1c7db142e69e39735fcb1c81e2040dc44af5d6fffe5e29 +size 3730627 diff --git a/model/model/layers/1/self_attn/q_proj/kernel/3.0 b/model/model/layers/1/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..7eabcd109bc76e3c80aeb29d8e700195685bb7cc --- /dev/null +++ b/model/model/layers/1/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c9b3bf205f01474c4f4fa9bc9982af347d35a46ad6cadcebb618a9a1e5a6615 +size 3732523 diff --git a/model/model/layers/1/self_attn/v_proj/kernel/.zarray b/model/model/layers/1/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/1/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/1/self_attn/v_proj/kernel/0.0 b/model/model/layers/1/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..382a2004b227aa5d17cc59a91e4d713ac9798680 --- /dev/null +++ b/model/model/layers/1/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b0437964c90da86b52a636477a081868e5ba478348b5471f690a9d65b1e648b +size 1228005 diff --git a/model/model/layers/1/self_attn/v_proj/kernel/1.0 b/model/model/layers/1/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..784a93900e19329773eed014930d7389c0adf8f1 --- /dev/null +++ b/model/model/layers/1/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6ad2e2709c1db5a1ce692b09966a95fa5d80206f14c2dcf1a100752054f756b +size 1228391 diff --git a/model/model/layers/1/self_attn/v_proj/kernel/2.0 b/model/model/layers/1/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..a0cb33d0327318cb94b6a9953149574b2bb9d7f7 --- /dev/null +++ b/model/model/layers/1/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3426f743900bb8a704fec18b6eb63094ff7798820dd69572a2a6ec3282a5cae +size 1228233 diff --git a/model/model/layers/1/self_attn/v_proj/kernel/3.0 b/model/model/layers/1/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..d3e1b38642c4cbcb1ddca64b0ee6357f7cae7c0d --- /dev/null +++ b/model/model/layers/1/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5960013ec38a7ac1676326621ae09389d4b5aaa5f31287fcb549a6a3d15fc74c +size 1228466 diff --git 
a/model/model/layers/10/input_layernorm/kernel/.zarray b/model/model/layers/10/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/10/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/input_layernorm/kernel/0 b/model/model/layers/10/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..108f5d3a47d52106d38bc2ca42e600d068c7a859 Binary files /dev/null and b/model/model/layers/10/input_layernorm/kernel/0 differ diff --git a/model/model/layers/10/mlp/down_proj/kernel/.zarray b/model/model/layers/10/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/10/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/mlp/down_proj/kernel/0.0 b/model/model/layers/10/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..d78729d604f06411ab6fb7f0d59e5397a6a49768 --- /dev/null +++ b/model/model/layers/10/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:474f5e7b9effa28d8778dddd8f03f772fc51b76012681149328b6381d1e0978b +size 9811483 diff --git a/model/model/layers/10/mlp/down_proj/kernel/0.1 b/model/model/layers/10/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..381cf6e60491c541fd8ae3903caec86a69eb5a73 --- 
/dev/null +++ b/model/model/layers/10/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6950b5312cdf680baf84ecee0ee2dbe216cd3470b1dc92a089defde9baf779c +size 9813107 diff --git a/model/model/layers/10/mlp/down_proj/kernel/0.2 b/model/model/layers/10/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..62e070efb14885eebecf647dfc54f7abbc7def20 --- /dev/null +++ b/model/model/layers/10/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b9e138418eda3cd50797129a218c6b617c3770167414824c490d0416b24caea +size 9809359 diff --git a/model/model/layers/10/mlp/down_proj/kernel/0.3 b/model/model/layers/10/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..4907bdd02ad705d76779e6cee32f8da5c73a6ebf --- /dev/null +++ b/model/model/layers/10/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:020283a0a0cbf3a3031eb02f31fd7c7eb1bc8c3987abee6270566a2d99e17444 +size 9811724 diff --git a/model/model/layers/10/mlp/gate_proj/kernel/.zarray b/model/model/layers/10/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/10/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/mlp/gate_proj/kernel/0.0 b/model/model/layers/10/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..056789143ac6f443706ce31a78c1eb7f9dc27d21 --- /dev/null +++ b/model/model/layers/10/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:2d730589b14aaf10f40915927ce6f929adcfec8dc1b1e5767b4dad99de26cd8a +size 9814280 diff --git a/model/model/layers/10/mlp/gate_proj/kernel/1.0 b/model/model/layers/10/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..03a9c781bd72ef271bf69df0fc94366c3d9e1bf8 --- /dev/null +++ b/model/model/layers/10/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b567932e922a2172fb309035a52d329ebe3bc93751240c04cb9b25a823c3e56 +size 9815151 diff --git a/model/model/layers/10/mlp/gate_proj/kernel/2.0 b/model/model/layers/10/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..7671dee460292913ad130ec53d131d2b87a08a7c --- /dev/null +++ b/model/model/layers/10/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b28db78594286f7116f6f0eedf434fd5961e57f1f168ba61659071cdca7ed0c8 +size 9814926 diff --git a/model/model/layers/10/mlp/gate_proj/kernel/3.0 b/model/model/layers/10/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..8fa2239e854ef4d248fb57c9e6df39323f354595 --- /dev/null +++ b/model/model/layers/10/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c14bc7566fa06c9a360e6893c3556683102b6d5ec51a109e8e76b4839aeb168 +size 9813043 diff --git a/model/model/layers/10/mlp/up_proj/kernel/.zarray b/model/model/layers/10/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/10/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/mlp/up_proj/kernel/0.0 
b/model/model/layers/10/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..2129746e4bae64dfc8045f2629a4db549596fa11 --- /dev/null +++ b/model/model/layers/10/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a02d170f515c66b21b2b19a9ad9bba70a068f9ef7e9390172e0a4f81905022e +size 9801386 diff --git a/model/model/layers/10/mlp/up_proj/kernel/1.0 b/model/model/layers/10/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..f416062274dbbaef6ff0b045b4a2d9f0ef8baf63 --- /dev/null +++ b/model/model/layers/10/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9624fd72973d9b2acbf3f22458fbb37760aea12308e8a99205c085a54c43013 +size 9802328 diff --git a/model/model/layers/10/mlp/up_proj/kernel/2.0 b/model/model/layers/10/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..486c91b3cdfd275dab53186b09ab8ccbf67bd32b --- /dev/null +++ b/model/model/layers/10/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ced798408508c27fa3698a7368760c98e1ad1d3abe65464687d1d57ccbd5dbc4 +size 9801901 diff --git a/model/model/layers/10/mlp/up_proj/kernel/3.0 b/model/model/layers/10/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..834425f82983bc95be33e6636ebe65014cc4365e --- /dev/null +++ b/model/model/layers/10/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b5829e1ddc90b80cfa1075be7a8924d9a7cd4b75c334d519fca2b39d2705f3a +size 9799640 diff --git a/model/model/layers/10/post_attention_layernorm/kernel/.zarray b/model/model/layers/10/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/10/post_attention_layernorm/kernel/.zarray @@ 
-0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/post_attention_layernorm/kernel/0 b/model/model/layers/10/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..888d1ff277e52424ab5ff937dfe92a2f71a6a941 Binary files /dev/null and b/model/model/layers/10/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/10/self_attn/k_proj/kernel/.zarray b/model/model/layers/10/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/10/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/self_attn/k_proj/kernel/0.0 b/model/model/layers/10/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..61c597ea3821a38862c99e3cb2a55c4ab5ba1bc6 --- /dev/null +++ b/model/model/layers/10/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a63254653e8145afc2399c0160525536e46023e1ca7c32832fbf15ec62010cd1 +size 1234838 diff --git a/model/model/layers/10/self_attn/k_proj/kernel/1.0 b/model/model/layers/10/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..dcc9453a9258bbe8f994d2feed7dfad49109ba0b --- /dev/null +++ b/model/model/layers/10/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa45c7f60d3d8a5e27af8275a34e0ad88b13bdbb903dbe400a3c28f765723223 +size 1235051 diff --git 
a/model/model/layers/10/self_attn/k_proj/kernel/2.0 b/model/model/layers/10/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..517f40a77dd089be02bb86a6284e21888e42b4c8 --- /dev/null +++ b/model/model/layers/10/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e12bdf741c2edb0132271c1cef553f99227bada4d336725199c04711b26c3a0d +size 1234908 diff --git a/model/model/layers/10/self_attn/k_proj/kernel/3.0 b/model/model/layers/10/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..1fd5f9928c1014f2d927a4fcf4bee8fa86624683 --- /dev/null +++ b/model/model/layers/10/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97e157ffd040bd64e5b1da0f7884c89ad49e8f4a861e43d1ad13e577f142ee2c +size 1235004 diff --git a/model/model/layers/10/self_attn/o_proj/kernel/.zarray b/model/model/layers/10/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/10/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/self_attn/o_proj/kernel/0.0 b/model/model/layers/10/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..5ca22a745475f04060d586fc1aaf01cacf926ce1 --- /dev/null +++ b/model/model/layers/10/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be8c730f003499822d8d32cb5c4bbed996b9984bbab80a2337039e7b30919949 +size 3674829 diff --git a/model/model/layers/10/self_attn/o_proj/kernel/0.1 b/model/model/layers/10/self_attn/o_proj/kernel/0.1 new file mode 100644 
index 0000000000000000000000000000000000000000..fa579fcc330cb9d43653e6459ec59d0110302eaa --- /dev/null +++ b/model/model/layers/10/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2285bcc89f6e43e6ce7bc99d66b2dca125f8b35a9cb260960963175360506df1 +size 3675643 diff --git a/model/model/layers/10/self_attn/o_proj/kernel/0.2 b/model/model/layers/10/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..4ff177b38d4a3a8438d41f285a5e4fe2ae19eb09 --- /dev/null +++ b/model/model/layers/10/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:354a7ac91341c5663245830f1c119622c8d39813e6f2c9a6bb0d5f0771202f1a +size 3673387 diff --git a/model/model/layers/10/self_attn/o_proj/kernel/0.3 b/model/model/layers/10/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..100e9b2d76ab5696aecf10f32084d3e024b5e8b8 --- /dev/null +++ b/model/model/layers/10/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0448391b58c9698ac938ec99e8b8d51aba492b30a158cb1f769a5f911d0a6fec +size 3674202 diff --git a/model/model/layers/10/self_attn/q_proj/kernel/.zarray b/model/model/layers/10/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/10/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/self_attn/q_proj/kernel/0.0 b/model/model/layers/10/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..1544e88d8197517b25a7e9edca03fa3e18425e2f --- /dev/null +++ 
b/model/model/layers/10/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92f5844bd000da795ffb7e810c7ececb3f6caa29804cc71747a2052cfec07399 +size 3700636 diff --git a/model/model/layers/10/self_attn/q_proj/kernel/1.0 b/model/model/layers/10/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..e06fd55d8813f653d699c8ee6d99a2922779ef7d --- /dev/null +++ b/model/model/layers/10/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e6f07c1092aee4fb2ac60ef80f108daf81f04bec07559ad29a394b97203a19e +size 3700551 diff --git a/model/model/layers/10/self_attn/q_proj/kernel/2.0 b/model/model/layers/10/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..943e2346bcf28207615270f5c5dc92a3e7033967 --- /dev/null +++ b/model/model/layers/10/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f25a7f2b17f151ff1f3a3313e9ca73ab9e54914e4325314974a6c05ec8527da8 +size 3700149 diff --git a/model/model/layers/10/self_attn/q_proj/kernel/3.0 b/model/model/layers/10/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..07daf9a0dc07a619eeb725f5f2f8ffa3cf03f835 --- /dev/null +++ b/model/model/layers/10/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c2ac954319293cfc00b5fb96658439597355fdcccb4333a694fe7204169bfeb +size 3700510 diff --git a/model/model/layers/10/self_attn/v_proj/kernel/.zarray b/model/model/layers/10/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/10/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/self_attn/v_proj/kernel/0.0 b/model/model/layers/10/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..68bec36cb9a0bbd5a006a046d24614e53dc265a2 --- /dev/null +++ b/model/model/layers/10/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d71daf110a930334a1ccf2eb563fcdf4607ce88dfefa3aee65e763945b22c27b +size 1226584 diff --git a/model/model/layers/10/self_attn/v_proj/kernel/1.0 b/model/model/layers/10/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..8a660a1ccc2d27f5b7e58ccfab0b3634d7a14455 --- /dev/null +++ b/model/model/layers/10/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76e28efafe6df224b7435eb8b4da3e8ec3975d58ef11d49f4b47d2d8ae0c7792 +size 1226248 diff --git a/model/model/layers/10/self_attn/v_proj/kernel/2.0 b/model/model/layers/10/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..e87ded25f673956e950717c2cd2c7875ef69b443 --- /dev/null +++ b/model/model/layers/10/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63b4e28e9f0f19db15243c9b4ad6c3fff1329ff230c832f9ed777994fde8518b +size 1226586 diff --git a/model/model/layers/10/self_attn/v_proj/kernel/3.0 b/model/model/layers/10/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..05ec07030188678912d75054870bdc92d4ecaec8 --- /dev/null +++ b/model/model/layers/10/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:458ea1ae818f0a5021477c7f98f2ebf26f730ac275a602795a7e463e6472aea7 +size 1225446 
diff --git a/model/model/layers/11/input_layernorm/kernel/.zarray b/model/model/layers/11/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/11/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/11/input_layernorm/kernel/0 b/model/model/layers/11/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..c38afd53c795777ace87449c300c00e9d539b9dd Binary files /dev/null and b/model/model/layers/11/input_layernorm/kernel/0 differ diff --git a/model/model/layers/11/mlp/down_proj/kernel/.zarray b/model/model/layers/11/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/11/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/11/mlp/down_proj/kernel/0.0 b/model/model/layers/11/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..b2ca9efb0fffa40fabe842172c501ac70f8155ab --- /dev/null +++ b/model/model/layers/11/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e36f8036b418ad38f363d6d562c62f314c2014a6cb852fb5b1d9aec5737aa8fd +size 9809090 diff --git a/model/model/layers/11/mlp/down_proj/kernel/0.1 b/model/model/layers/11/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..baae675f64314f770cb0a3267cae668db090b640 --- /dev/null +++ b/model/model/layers/11/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f98d8a504ba8fa5a19db21161c26724279d86f76ccc20c8b71d1165670e4b3f9 +size 9810528 diff --git a/model/model/layers/11/mlp/down_proj/kernel/0.2 b/model/model/layers/11/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..8a2c3d53653280037789d031c2523c6b47379fe3 --- /dev/null +++ b/model/model/layers/11/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a28f2a7176f8392c27215547a975b5b0ac124a62030fc1840325cae83ae08da +size 9807750 diff --git a/model/model/layers/11/mlp/down_proj/kernel/0.3 b/model/model/layers/11/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..8aa3167a5e1c428722ace1bf1116a9d2e6f61820 --- /dev/null +++ b/model/model/layers/11/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b733d26a3d754516bb523259b9519e5a79dc290b2d865cd53200e106c34ed86 +size 9809312 diff --git a/model/model/layers/11/mlp/gate_proj/kernel/.zarray b/model/model/layers/11/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/11/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/11/mlp/gate_proj/kernel/0.0 b/model/model/layers/11/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..85d07b784ff5e2210052dc5dad9e15d1368276d8 --- /dev/null +++ b/model/model/layers/11/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae64c8a734ad20f7922220a6a14eb928416dd40b5015d391e4ded3da665362d1 +size 9819770 diff --git a/model/model/layers/11/mlp/gate_proj/kernel/1.0 b/model/model/layers/11/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..1ff3a4d292db6f8d28a60885c61ff8af2a135b27 --- /dev/null +++ b/model/model/layers/11/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:387a2aaaca3facdd7e00254c17a83c8ce1b5d7623a35ae1328e73a0a81ea968b +size 9821100 diff --git a/model/model/layers/11/mlp/gate_proj/kernel/2.0 b/model/model/layers/11/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..4ddcce255dde5cd2d1ec6851f1cd85316344f0b8 --- /dev/null +++ b/model/model/layers/11/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:878fe0c963218ead1b6300b1e87390a06d6d7334eda7e699cf4d681d3ed576f0 +size 9819351 diff --git a/model/model/layers/11/mlp/gate_proj/kernel/3.0 b/model/model/layers/11/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..11ce8f27308febbc2c4535e67dcb1f12cb50ae35 --- /dev/null +++ b/model/model/layers/11/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7f7c6d454eba5aca634a948102d9906b3c345e615cb45cd5af519a20086a564 +size 9818902 diff --git a/model/model/layers/11/mlp/up_proj/kernel/.zarray b/model/model/layers/11/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/11/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/11/mlp/up_proj/kernel/0.0 b/model/model/layers/11/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..fda96d1195905af78dcb80fa6c1d3aaf36114371 --- /dev/null +++ b/model/model/layers/11/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cf7797eca61d832980f28b353e1b4d970ac81500ec6eaecc85980ad968fdb5c +size 9805378 diff --git a/model/model/layers/11/mlp/up_proj/kernel/1.0 b/model/model/layers/11/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..a117bfb2d3b3a9fcc7d960a72ced04bff1c727ba --- /dev/null +++ b/model/model/layers/11/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4dcc040da813e44b289258f1b1eed9b088245999953bb0ead402ba010377aa4 +size 9806630 diff --git a/model/model/layers/11/mlp/up_proj/kernel/2.0 b/model/model/layers/11/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..1ba75715a011d6903e0c25684cee79d38f8febbe --- /dev/null +++ b/model/model/layers/11/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:870713665c82a10f7e3c73affdb1abb19f0471b464f3ed6347c5d6dc9804eed9 +size 9806776 diff --git a/model/model/layers/11/mlp/up_proj/kernel/3.0 b/model/model/layers/11/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..8f8c9755d72fa6cc183a71867e71443432094579 --- /dev/null +++ b/model/model/layers/11/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cec1bc706b343f6ed22ec2968e10e7fa756ec70d1a12e3a898edefb43f7ffe1b +size 9804759 diff --git a/model/model/layers/11/post_attention_layernorm/kernel/.zarray b/model/model/layers/11/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ 
b/model/model/layers/11/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/11/post_attention_layernorm/kernel/0 b/model/model/layers/11/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..2c9fa77f3c2f06e013996547b4304b3cc6d4ba9d Binary files /dev/null and b/model/model/layers/11/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/11/self_attn/k_proj/kernel/.zarray b/model/model/layers/11/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/11/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/11/self_attn/k_proj/kernel/0.0 b/model/model/layers/11/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..6465b7c96f2f8ec409a18d51f46ac01a08662307 --- /dev/null +++ b/model/model/layers/11/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f1e7b8f31d81ae7c9d38c0fd1218d1c1c9a0dfc3b557983c141c15e1bf17a00 +size 1232257 diff --git a/model/model/layers/11/self_attn/k_proj/kernel/1.0 b/model/model/layers/11/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..a325fce03f3b6a255beb003ba81a25184a583204 --- /dev/null +++ b/model/model/layers/11/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:a6ace34cf0e017e111bb79ea76c3cccc12558e4336415633decdecb1f923e753 +size 1232515 diff --git a/model/model/layers/11/self_attn/k_proj/kernel/2.0 b/model/model/layers/11/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..705c2f89767707b954c1856d2fc9c6b1e8310568 --- /dev/null +++ b/model/model/layers/11/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08c82ba19aacd5cf4f00075906d8ab90595ac9693f4e04020851b7c02d2f2df9 +size 1232135 diff --git a/model/model/layers/11/self_attn/k_proj/kernel/3.0 b/model/model/layers/11/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..ab63e87be1f546107019bf3e004d8e3e62ff4f2d --- /dev/null +++ b/model/model/layers/11/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e0a47e2e50fea902ffd63fd8719795e8bc90df29869f112df6d1d9bcd2bafbe +size 1232293 diff --git a/model/model/layers/11/self_attn/o_proj/kernel/.zarray b/model/model/layers/11/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/11/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/11/self_attn/o_proj/kernel/0.0 b/model/model/layers/11/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..106ac15835a3bad7c4f8e6fbf2e18d7d4c1dfb64 --- /dev/null +++ b/model/model/layers/11/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dec5adc8e1148d23a88469b32ffaabc413a192bb117eb8e7f425e692abbede8 +size 3674238 diff --git 
a/model/model/layers/11/self_attn/o_proj/kernel/0.1 b/model/model/layers/11/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..572699d260d541d17c2e94b4cd208dbd4763f066 --- /dev/null +++ b/model/model/layers/11/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf36aa45c841b89a48b8c8a0360f522c6e491a3b5d7a10976917fe884ffd70be +size 3675009 diff --git a/model/model/layers/11/self_attn/o_proj/kernel/0.2 b/model/model/layers/11/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..83b10988eee7db94a5c6b02b0e9a93fb06486aef --- /dev/null +++ b/model/model/layers/11/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5d796cfdf361558a40a66d527983df3e4f8b6412d5aa8e882a593215d98bb4b +size 3673450 diff --git a/model/model/layers/11/self_attn/o_proj/kernel/0.3 b/model/model/layers/11/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..b37ef795e36c846873ff81cc82b6dafd59107ed2 --- /dev/null +++ b/model/model/layers/11/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c3d73293315072156f8ecf3f86d708223616884d0fa88c792cb935ce8d1742 +size 3673871 diff --git a/model/model/layers/11/self_attn/q_proj/kernel/.zarray b/model/model/layers/11/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/11/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/11/self_attn/q_proj/kernel/0.0 b/model/model/layers/11/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..2adfea1031031cd9459196143e75b14504013bb9 --- /dev/null +++ b/model/model/layers/11/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59d402429de335edd5b6c4b4ea60799e86f53dd9a9e43ab4f04c1071509f5221 +size 3695364 diff --git a/model/model/layers/11/self_attn/q_proj/kernel/1.0 b/model/model/layers/11/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..8b67b1a8b9e576253aba0bd3a596e016a7fe1d61 --- /dev/null +++ b/model/model/layers/11/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c803adc1b1a92a88fda1cd3352b5437b408295717d9909900049e85ccf862e22 +size 3696100 diff --git a/model/model/layers/11/self_attn/q_proj/kernel/2.0 b/model/model/layers/11/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..0a6cb83f317ee48dc5e00d128a8d54eb2781bb8d --- /dev/null +++ b/model/model/layers/11/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea9cb7524d4c1f5641df397f0ae26df74898d9d66510fd2d459ac5e0e7300ceb +size 3695847 diff --git a/model/model/layers/11/self_attn/q_proj/kernel/3.0 b/model/model/layers/11/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..e33d3af0aa55c7cb72366135f265067e1cc0358a --- /dev/null +++ b/model/model/layers/11/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60f5e0eb7eb416427fdfe90abe295a5ddb6effd032c6edddab059b0cb5a5f0e8 +size 3695656 diff --git a/model/model/layers/11/self_attn/v_proj/kernel/.zarray b/model/model/layers/11/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/11/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/11/self_attn/v_proj/kernel/0.0 b/model/model/layers/11/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..91427cd7aa976bcf348bb740caa2082d29bc7a79 --- /dev/null +++ b/model/model/layers/11/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a068e0b5791566894a770384fc493210fb51f5afd58434477dd60c18813c1cd0 +size 1225252 diff --git a/model/model/layers/11/self_attn/v_proj/kernel/1.0 b/model/model/layers/11/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..367fa9f69885121a861e13c9d2d98714a3152250 --- /dev/null +++ b/model/model/layers/11/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff0753d87fe2a4bfdaf948e45b0bf0ca170eede2eb89c9350c024d42e80503fe +size 1225024 diff --git a/model/model/layers/11/self_attn/v_proj/kernel/2.0 b/model/model/layers/11/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..cf40780fe3ae90b46540a93eb99bb35ee6498b5f --- /dev/null +++ b/model/model/layers/11/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d0162d81978ec06eb3d76cadfef02d849c1033d4437930a1d3ca5d5c4bfa8fb +size 1225442 diff --git a/model/model/layers/11/self_attn/v_proj/kernel/3.0 b/model/model/layers/11/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..813c5448b9ac8239ef33fd5ed93bb61190c20a13 --- /dev/null +++ b/model/model/layers/11/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0ab5cef8597420079760e20da0ad902b8f1e5f070e12363881f59242f4cacca +size 1224467 
diff --git a/model/model/layers/12/input_layernorm/kernel/.zarray b/model/model/layers/12/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/12/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/12/input_layernorm/kernel/0 b/model/model/layers/12/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..7e37ef58022309567e6c86b6db84585bbc572e22 Binary files /dev/null and b/model/model/layers/12/input_layernorm/kernel/0 differ diff --git a/model/model/layers/12/mlp/down_proj/kernel/.zarray b/model/model/layers/12/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/12/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/12/mlp/down_proj/kernel/0.0 b/model/model/layers/12/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..71edd9f45b6fcf0e034e16257543b1bfef88dfd0 --- /dev/null +++ b/model/model/layers/12/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16a4d4c86e2aeb89534ba7b0e3b9192a92a9d0e42f6514a26933c5888bd129e8 +size 9807925 diff --git a/model/model/layers/12/mlp/down_proj/kernel/0.1 b/model/model/layers/12/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..78e3b813962895ecc090cbd52963c0d10b57552c --- /dev/null +++ b/model/model/layers/12/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a86e63aeb8fd2f4e075b0edc19aa000716a310138842797c1d1e8ef088f4010 +size 9809358 diff --git a/model/model/layers/12/mlp/down_proj/kernel/0.2 b/model/model/layers/12/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..bc635a153d8f948fff620fa173f64d76d8d2d075 --- /dev/null +++ b/model/model/layers/12/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3984d5e5b3b92a76fe9b36c2c59d0680b685f95842fc09848fc9022329fd1fa +size 9807502 diff --git a/model/model/layers/12/mlp/down_proj/kernel/0.3 b/model/model/layers/12/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..bdf53a72351df3f2b1b16e41d714f683dc0d9615 --- /dev/null +++ b/model/model/layers/12/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:931217576318ed7852c9e109757d3f804b5c90cf53d8f0b35c678eadf7cdd863 +size 9809057 diff --git a/model/model/layers/12/mlp/gate_proj/kernel/.zarray b/model/model/layers/12/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/12/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/12/mlp/gate_proj/kernel/0.0 b/model/model/layers/12/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..40877387290f298ebbeab7a64778d98876c917ad --- /dev/null +++ b/model/model/layers/12/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f922b066315e042b373fef82d93f94cb8e6a32331d64d5f7ecd44c25a525dd68 +size 9814077 diff --git a/model/model/layers/12/mlp/gate_proj/kernel/1.0 b/model/model/layers/12/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..c9a755ed73d90811aae80ac961d1bd8c9fb9e5a0 --- /dev/null +++ b/model/model/layers/12/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:791f6a0a436d80f86a1ed7842e10c65d578e9a911f2cf4dee1630a1e0e43af33 +size 9814788 diff --git a/model/model/layers/12/mlp/gate_proj/kernel/2.0 b/model/model/layers/12/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..45d0e3a315ab268bb59643d10f05a11f1e9f7943 --- /dev/null +++ b/model/model/layers/12/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6bf856e23f748d7f72b83320ebeeaaf15b242772d6f57328f8c6fc5f74ab2c2 +size 9813361 diff --git a/model/model/layers/12/mlp/gate_proj/kernel/3.0 b/model/model/layers/12/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..158f9477651b4b305825d3e17b8c877120b48c09 --- /dev/null +++ b/model/model/layers/12/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55c66c56bddaee52c93881fc8c7ed4ceb3f588195a49ae4733a5af81f8392944 +size 9813488 diff --git a/model/model/layers/12/mlp/up_proj/kernel/.zarray b/model/model/layers/12/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/12/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/12/mlp/up_proj/kernel/0.0 b/model/model/layers/12/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..2a6ec46acbdd883f980e0a7d66944798d893cb55 --- /dev/null +++ b/model/model/layers/12/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dcd3ed6be2fd2b199741f7451187c64cbd3a93b78128c561360189061c2b0be +size 9806820 diff --git a/model/model/layers/12/mlp/up_proj/kernel/1.0 b/model/model/layers/12/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..fe5ef39605fee6b607285ebb4f9df662d8bbcc09 --- /dev/null +++ b/model/model/layers/12/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:118f6188f3b30c788781665fc0619d594866e7d811f0c3292277ec36408f7768 +size 9807939 diff --git a/model/model/layers/12/mlp/up_proj/kernel/2.0 b/model/model/layers/12/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..34085393c444cdb718d9c437aa3e1dae547c8c32 --- /dev/null +++ b/model/model/layers/12/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6099efbdcf05fd94449ee02943e72a1fbd86fd0ad248f004d7528a708a9fc5ea +size 9806867 diff --git a/model/model/layers/12/mlp/up_proj/kernel/3.0 b/model/model/layers/12/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..2b78cc10548d2fa226f5195f60ee411d937a405f --- /dev/null +++ b/model/model/layers/12/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:333d054a28722dfd0ddf2edb4567e31efd4659582c3322eacaad533c7c3fc0a9 +size 9804493 diff --git a/model/model/layers/12/post_attention_layernorm/kernel/.zarray b/model/model/layers/12/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ 
b/model/model/layers/12/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/12/post_attention_layernorm/kernel/0 b/model/model/layers/12/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..b507133abedc3c0c295ce687c13338db14037be8 Binary files /dev/null and b/model/model/layers/12/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/12/self_attn/k_proj/kernel/.zarray b/model/model/layers/12/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/12/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/12/self_attn/k_proj/kernel/0.0 b/model/model/layers/12/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..842a9d1e0bb3f920962f6880e7033afcd836f63a --- /dev/null +++ b/model/model/layers/12/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:325328f6cb8b5e44f407f18faeadd7ef5e565930d85394667efdda7226f928e1 +size 1234898 diff --git a/model/model/layers/12/self_attn/k_proj/kernel/1.0 b/model/model/layers/12/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..9a954b66178db0ab89d50dbb323d68062e6d1ab0 --- /dev/null +++ b/model/model/layers/12/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:7c59ec4d22afd32179ccbc65f6653a98dc18f05f25d52d6baa501133bfdfc056 +size 1234972 diff --git a/model/model/layers/12/self_attn/k_proj/kernel/2.0 b/model/model/layers/12/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..780cca6cbfed08ed64e942a005caab6a9fbc1924 --- /dev/null +++ b/model/model/layers/12/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e68bd3d73c524b903c778ac5305cc3513443562a9467d9280263ccaaf1054d37 +size 1234887 diff --git a/model/model/layers/12/self_attn/k_proj/kernel/3.0 b/model/model/layers/12/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..928d4cefcb1c6bc8777d7b54b89cc994e6636b46 --- /dev/null +++ b/model/model/layers/12/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32821f7b54057985707d8c332c0522b169d0daee4741d5d16e2a38e40e538f3c +size 1234958 diff --git a/model/model/layers/12/self_attn/o_proj/kernel/.zarray b/model/model/layers/12/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/12/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/12/self_attn/o_proj/kernel/0.0 b/model/model/layers/12/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f1488906e6e38d5a2fd6298ca8bdb7a0c3dfe261 --- /dev/null +++ b/model/model/layers/12/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df995d98b367cb048325a90371bebbd89dbe49c717c493416558703c515236ab +size 3671900 diff --git 
a/model/model/layers/12/self_attn/o_proj/kernel/0.1 b/model/model/layers/12/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..de08daa4014c9a60dcc323f12faa259a1c03f453 --- /dev/null +++ b/model/model/layers/12/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9ba71a856eb4a51d4e5c0d1817eed866280584ddbed36a2c502988232572864 +size 3672917 diff --git a/model/model/layers/12/self_attn/o_proj/kernel/0.2 b/model/model/layers/12/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..40127e3259af97d07bf4e17a49f188cb9a9d5063 --- /dev/null +++ b/model/model/layers/12/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce44f85e36f0e2c1aafd3539e94ea36bae413db24f7239e413e22b1c37868c5c +size 3671479 diff --git a/model/model/layers/12/self_attn/o_proj/kernel/0.3 b/model/model/layers/12/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..32793c8b11824d75e49eeaf8d4d602d4a84e0e53 --- /dev/null +++ b/model/model/layers/12/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6178702d0dd7bb7b20326c8f7f256d357e2825df2750ea8a4b7d4ca9b63d564 +size 3671530 diff --git a/model/model/layers/12/self_attn/q_proj/kernel/.zarray b/model/model/layers/12/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/12/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/12/self_attn/q_proj/kernel/0.0 b/model/model/layers/12/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..a628c170b959ed6afece43a3f9d6e93dcb3ac112 --- /dev/null +++ b/model/model/layers/12/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f14bf461718ff2d934f20d58d661ad24b2cadc3a8cbfd1590f861506f1677de5 +size 3706303 diff --git a/model/model/layers/12/self_attn/q_proj/kernel/1.0 b/model/model/layers/12/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..22dc9c8df95029b474b6bc64df1e9b52232ca7af --- /dev/null +++ b/model/model/layers/12/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd7b3426522adaba041e302d3724c99c57eb94b9e0aa600519c026d4a9f16e54 +size 3706426 diff --git a/model/model/layers/12/self_attn/q_proj/kernel/2.0 b/model/model/layers/12/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..90ace3b8aae1284671ce6a8210690da005cb4f0e --- /dev/null +++ b/model/model/layers/12/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f34a513316a7c8ce5fe3ccba43b734ad3f614a31f748a593c6d97fcd42ea58fd +size 3706212 diff --git a/model/model/layers/12/self_attn/q_proj/kernel/3.0 b/model/model/layers/12/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..df960527bab514c6628dea7bc0c7956f1a1a2a56 --- /dev/null +++ b/model/model/layers/12/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eb11d437979e8417a8cf1413743c9027965174e13b7bc4f6ec89fa5976aa968 +size 3705797 diff --git a/model/model/layers/12/self_attn/v_proj/kernel/.zarray b/model/model/layers/12/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/12/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/12/self_attn/v_proj/kernel/0.0 b/model/model/layers/12/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..0d610733f7cb05ebef6236353885ef5f5a47d2bc --- /dev/null +++ b/model/model/layers/12/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97dea3f668610c307c0655545f201fc11bcb6fda1d3993ab8fd8ed5156b065bf +size 1225611 diff --git a/model/model/layers/12/self_attn/v_proj/kernel/1.0 b/model/model/layers/12/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..70683b606c5ab327b590c0c4b332fa75b5969fa6 --- /dev/null +++ b/model/model/layers/12/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:930730da43ee95fa898e56d212b777a4c63e873255ad11cafd7198b17fabe163 +size 1225926 diff --git a/model/model/layers/12/self_attn/v_proj/kernel/2.0 b/model/model/layers/12/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..747e404b7db79d5cfe409d2546002df24fd67280 --- /dev/null +++ b/model/model/layers/12/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:047415f00b6b22cf6d13b7aba9423403ac6c8dbbe0575ffc1f7871d109647833 +size 1225629 diff --git a/model/model/layers/12/self_attn/v_proj/kernel/3.0 b/model/model/layers/12/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..3fc486bf86c49bb070c5493158f41a69eaab7972 --- /dev/null +++ b/model/model/layers/12/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e2f0ed69cdef29e7b4d84347670710cee83b320d7e156edadc9d69a2ed872c7 +size 1224943 
diff --git a/model/model/layers/13/input_layernorm/kernel/.zarray b/model/model/layers/13/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/13/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/13/input_layernorm/kernel/0 b/model/model/layers/13/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..2699751de750cfc1cf42a154161dd0924db27490 Binary files /dev/null and b/model/model/layers/13/input_layernorm/kernel/0 differ diff --git a/model/model/layers/13/mlp/down_proj/kernel/.zarray b/model/model/layers/13/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/13/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/13/mlp/down_proj/kernel/0.0 b/model/model/layers/13/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..6bc3429ab4fd510b84a53d8cf39db85fea956c81 --- /dev/null +++ b/model/model/layers/13/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fb024a279b7f08458bdd965d64f592420655793ebca5b4cc3a7b46b1167f44b +size 9806848 diff --git a/model/model/layers/13/mlp/down_proj/kernel/0.1 b/model/model/layers/13/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..7f8a4faae7def452eeab3101c10dad1a4de14af9 --- /dev/null +++ b/model/model/layers/13/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ecc6dd829378f9121dddc9843f1ee060034c118a87d0993ee979edbabcfabf9 +size 9806906 diff --git a/model/model/layers/13/mlp/down_proj/kernel/0.2 b/model/model/layers/13/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..31c305786463e7f16f85024f63221c10fa290d60 --- /dev/null +++ b/model/model/layers/13/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbfc982e3a35e3d083fd21c3113ee58080abfce63c5576cf2182c07349ef4eb7 +size 9805467 diff --git a/model/model/layers/13/mlp/down_proj/kernel/0.3 b/model/model/layers/13/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..ffe4551d2a34f9979cce3231fba7348932b475bf --- /dev/null +++ b/model/model/layers/13/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:381203332c86e2fa8f1599aa4bce5313a79561789cecf3d5812d9fcbe35e825c +size 9806443 diff --git a/model/model/layers/13/mlp/gate_proj/kernel/.zarray b/model/model/layers/13/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/13/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/13/mlp/gate_proj/kernel/0.0 b/model/model/layers/13/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f5953f43f41fd575d83dc0262f8fd33378033259 --- /dev/null +++ b/model/model/layers/13/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1a461b643ceacbec335fa9a5cb7318b8ca817f15c9b313d4aadb727a4f714c4 +size 9816160 diff --git a/model/model/layers/13/mlp/gate_proj/kernel/1.0 b/model/model/layers/13/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..134a02c40ac108c70723473d387c053b59deb40b --- /dev/null +++ b/model/model/layers/13/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:754b29d33656f0fbd6c57e8b5041a2738fa09cf93114b88eae29026b4e5de73d +size 9817626 diff --git a/model/model/layers/13/mlp/gate_proj/kernel/2.0 b/model/model/layers/13/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..257628fff2b12e2c8411c705fc1f292e8df5c4f9 --- /dev/null +++ b/model/model/layers/13/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d772f8fef3d0c7c0f65cb98d0d70638ae14b440a759b44c353de826e53f58069 +size 9816139 diff --git a/model/model/layers/13/mlp/gate_proj/kernel/3.0 b/model/model/layers/13/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..fa7def21dea51a838e356be3c4938f1a8da24304 --- /dev/null +++ b/model/model/layers/13/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01226f60366c37b5ac73d192c16023199c53902cf8b90d36763bedbb4c10bfbc +size 9814843 diff --git a/model/model/layers/13/mlp/up_proj/kernel/.zarray b/model/model/layers/13/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/13/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/13/mlp/up_proj/kernel/0.0 b/model/model/layers/13/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c73d53fac354beaa4c5240399e353d9f062947ed --- /dev/null +++ b/model/model/layers/13/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eeb0894c577f4d57549cb90e803a7ff72b0bf3063ce64482b2ed1e34495b28a +size 9808729 diff --git a/model/model/layers/13/mlp/up_proj/kernel/1.0 b/model/model/layers/13/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..d2344eb9e2906ba860c048783f4dd1f554ea35ff --- /dev/null +++ b/model/model/layers/13/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5687afe8d6ef2170cd0967b534cce8c00ab971edbc0ea7e405a6134d68da738 +size 9809104 diff --git a/model/model/layers/13/mlp/up_proj/kernel/2.0 b/model/model/layers/13/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..6f8c3d4a505c0f44ee0d0a28cadb2030fc69ab33 --- /dev/null +++ b/model/model/layers/13/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2006f42a709d11fe8450ad47e08a94afb7e0ea93b583a290f867f200386c1f29 +size 9807591 diff --git a/model/model/layers/13/mlp/up_proj/kernel/3.0 b/model/model/layers/13/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..3ed05831f1aaf52f13f3c8a03e5dcf04ccf7c1e4 --- /dev/null +++ b/model/model/layers/13/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4af8e0f8102348412008f5afa72deae1724143e6667c69a2fb95ff262dadd06a +size 9805664 diff --git a/model/model/layers/13/post_attention_layernorm/kernel/.zarray b/model/model/layers/13/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ 
b/model/model/layers/13/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/13/post_attention_layernorm/kernel/0 b/model/model/layers/13/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..41cae29ebeb9c517b79138b59475f4528f2c0570 Binary files /dev/null and b/model/model/layers/13/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/13/self_attn/k_proj/kernel/.zarray b/model/model/layers/13/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/13/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/13/self_attn/k_proj/kernel/0.0 b/model/model/layers/13/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..1adafd0079c043aac25a39b4dd7e1fc76d0de6f9 --- /dev/null +++ b/model/model/layers/13/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bfbfb09c0311dbb5f1d38af44fe0e189c76a6c84ac0bf94fe746defb92fa64a +size 1234481 diff --git a/model/model/layers/13/self_attn/k_proj/kernel/1.0 b/model/model/layers/13/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..9200b8706ee68b4e1d525688b3579136344b1be9 --- /dev/null +++ b/model/model/layers/13/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:3d4c22a22bfc6b68df5c76f904124f573dae51bfc38a05875a74dc22831d777f +size 1234616 diff --git a/model/model/layers/13/self_attn/k_proj/kernel/2.0 b/model/model/layers/13/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..2377123e9eea0e17a4f9901f5efd6b5922f1554f --- /dev/null +++ b/model/model/layers/13/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc988d3e34eb77feb2e9e60bd29a8cfb4125b4c2ebf00c36039df06742a9f5b7 +size 1234001 diff --git a/model/model/layers/13/self_attn/k_proj/kernel/3.0 b/model/model/layers/13/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..5608e6bfda7a019cf3aa76d37dafae08b9639034 --- /dev/null +++ b/model/model/layers/13/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:103c87dcfd28ac7a0bda75f57db5e473f7d761fd2fbd36cc70d3e3669ca90cc2 +size 1234129 diff --git a/model/model/layers/13/self_attn/o_proj/kernel/.zarray b/model/model/layers/13/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/13/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/13/self_attn/o_proj/kernel/0.0 b/model/model/layers/13/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..4430e77e5a55375e8ae62ffce8e8a0a953b4c731 --- /dev/null +++ b/model/model/layers/13/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc9d4b719740637c373b2e07d0157ed1810511f21ee7969ac673b1a08aca4c87 +size 3673315 diff --git 
a/model/model/layers/13/self_attn/o_proj/kernel/0.1 b/model/model/layers/13/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..22d844b9ace8dedfbf21ed2c80d30c59469a8b31 --- /dev/null +++ b/model/model/layers/13/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41d040d4b7a7ce5eeeb37f3fd11ca10fd1e6d718ec5da2409c29948f50ea9ed0 +size 3673807 diff --git a/model/model/layers/13/self_attn/o_proj/kernel/0.2 b/model/model/layers/13/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..8150b60698c7dba95f0e22e680f51db6544846e3 --- /dev/null +++ b/model/model/layers/13/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9d34fc88fb69a2e2219c0b29e9d266dace4f2f4e37428e5b51f0e6fac58abcb +size 3672941 diff --git a/model/model/layers/13/self_attn/o_proj/kernel/0.3 b/model/model/layers/13/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..0bbc7847c0b454e0e43f6d0441700624fe9fbe23 --- /dev/null +++ b/model/model/layers/13/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2da5dd2b50d2bbb7be53289516270e7655aac139fe60df72e41e8d1674b239f4 +size 3672651 diff --git a/model/model/layers/13/self_attn/q_proj/kernel/.zarray b/model/model/layers/13/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/13/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/13/self_attn/q_proj/kernel/0.0 b/model/model/layers/13/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..c3ce3180b1bcd92acbefe15e4269133576e2e0aa --- /dev/null +++ b/model/model/layers/13/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fff49365f3f62d5af113199acf8726df60d4a8c05f64a9f8e0d520c820d1fe7 +size 3701134 diff --git a/model/model/layers/13/self_attn/q_proj/kernel/1.0 b/model/model/layers/13/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..f507eb816032c612dfcc47f6d46407fc4627806d --- /dev/null +++ b/model/model/layers/13/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e29fd853191337df6980c05d946765da7998446fb9b3e2825fb595fea0208eab +size 3700842 diff --git a/model/model/layers/13/self_attn/q_proj/kernel/2.0 b/model/model/layers/13/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..27de34173b2e97ebe713bbceba4e5ffa902f540b --- /dev/null +++ b/model/model/layers/13/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1155365fede5b71b3f352a43c3edf4c0b6211710e6e27a31bec25d0746325a05 +size 3700306 diff --git a/model/model/layers/13/self_attn/q_proj/kernel/3.0 b/model/model/layers/13/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..a3a20e85f6ca604aa77a641a58c452299bb4aad6 --- /dev/null +++ b/model/model/layers/13/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:113fb8efcb0f9a42f688116cb3d83bbe757d86fc3653d1bafe33d7598f32d377 +size 3701388 diff --git a/model/model/layers/13/self_attn/v_proj/kernel/.zarray b/model/model/layers/13/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/13/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/13/self_attn/v_proj/kernel/0.0 b/model/model/layers/13/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..d9caa5d7b70c867eed721d5d9a8bab98c7552d9c --- /dev/null +++ b/model/model/layers/13/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f410c9d1f1c6663930027610a737240d3cd93753d4c2819f6ec7eab71e543989 +size 1227943 diff --git a/model/model/layers/13/self_attn/v_proj/kernel/1.0 b/model/model/layers/13/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..ef98fbed46e4cc687eca9a450a0289f86f2e4bab --- /dev/null +++ b/model/model/layers/13/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39d5ad67dfe5668b03cda1008f110e13a7eedd6c62f973d872613c5dbe1fa02b +size 1227958 diff --git a/model/model/layers/13/self_attn/v_proj/kernel/2.0 b/model/model/layers/13/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..dc4229800f20dfbbf4e878f74ab963e3c03aa245 --- /dev/null +++ b/model/model/layers/13/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b368192e78ed3e364839721a7b3a18624b14d7792ae25cc2ecd80692e8f57ee +size 1227871 diff --git a/model/model/layers/13/self_attn/v_proj/kernel/3.0 b/model/model/layers/13/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..e98cd6ac0cf81cab56b32dcea7140446edafe560 --- /dev/null +++ b/model/model/layers/13/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b16ba1129f56080df7d0b597c45322826e545f6e92eaecf77c871c4399f302cd +size 1227404 
diff --git a/model/model/layers/14/input_layernorm/kernel/.zarray b/model/model/layers/14/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/14/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/14/input_layernorm/kernel/0 b/model/model/layers/14/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..39b918288945849a327dfe93d84da9622958cecc Binary files /dev/null and b/model/model/layers/14/input_layernorm/kernel/0 differ diff --git a/model/model/layers/14/mlp/down_proj/kernel/.zarray b/model/model/layers/14/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/14/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/14/mlp/down_proj/kernel/0.0 b/model/model/layers/14/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..d8169ab7cd1efdac4e66fbcdf2d7b5dc9dcd6600 --- /dev/null +++ b/model/model/layers/14/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d675b1ae7e72291f260a2be6f38a4e3bede16adb7ec68fa6c7a40a31b316d6ce +size 9803693 diff --git a/model/model/layers/14/mlp/down_proj/kernel/0.1 b/model/model/layers/14/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..7b1830254ec9621efd1cb8afa4a603e8c9336d70 --- /dev/null +++ b/model/model/layers/14/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2d30fd21e5bfdf294dd5de5245af6254d0e33c15fbb278ada3b582f57b8ad48 +size 9803462 diff --git a/model/model/layers/14/mlp/down_proj/kernel/0.2 b/model/model/layers/14/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..441dd30a7e4578a73da0db8dbb6ca1384358930f --- /dev/null +++ b/model/model/layers/14/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:300e56dd110488e96012a15577c2ec2e4ea60a82dfb3ebd06b56e93e0081fa79 +size 9802691 diff --git a/model/model/layers/14/mlp/down_proj/kernel/0.3 b/model/model/layers/14/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..53aeee967c268c43b9bd53d37e2df23dc8073ef8 --- /dev/null +++ b/model/model/layers/14/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e0fee00a2cd22ebd409fedcb0282207b9f1f1e99bc90fd9ae64ab3cce64811e +size 9802739 diff --git a/model/model/layers/14/mlp/gate_proj/kernel/.zarray b/model/model/layers/14/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/14/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/14/mlp/gate_proj/kernel/0.0 b/model/model/layers/14/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..db8749b181b782fd66affa618bf22f2fb521d6d3 --- /dev/null +++ b/model/model/layers/14/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4429b86acf57a9ec25de017d87daeec4cd8ae27e5f04378a0de24cbea97e435d +size 9811275 diff --git a/model/model/layers/14/mlp/gate_proj/kernel/1.0 b/model/model/layers/14/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..e0f7ad8b492e55d960dfb2c391ff275b94f16c77 --- /dev/null +++ b/model/model/layers/14/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff980375b18ad53d8448aedff2ef8e76ac7cc95996bf44b70bd15bf2e34c037d +size 9811627 diff --git a/model/model/layers/14/mlp/gate_proj/kernel/2.0 b/model/model/layers/14/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..d65035a4acf47e01fae8362135eb98a98a0a288e --- /dev/null +++ b/model/model/layers/14/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6afda82b34d98ebacbee90f6e818b1f03ad7482c1606145f1560e3b9143799c +size 9810780 diff --git a/model/model/layers/14/mlp/gate_proj/kernel/3.0 b/model/model/layers/14/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..621b95e4b52798c1532b4cf8037b35934efce024 --- /dev/null +++ b/model/model/layers/14/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dac2800270aa40427ec775fe723c8818789ab88a53e6105a84ad28458f2f9b1 +size 9810527 diff --git a/model/model/layers/14/mlp/up_proj/kernel/.zarray b/model/model/layers/14/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/14/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/14/mlp/up_proj/kernel/0.0 b/model/model/layers/14/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ceafcb7e0843a6b9328213b1376e13c144384ade --- /dev/null +++ b/model/model/layers/14/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:873e4d52190328bbd88305b48cb74779bf317cd7b7fc7a36b555a683584eb032 +size 9805348 diff --git a/model/model/layers/14/mlp/up_proj/kernel/1.0 b/model/model/layers/14/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..54ba46a85559423486d894c55f38a95a8525c698 --- /dev/null +++ b/model/model/layers/14/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f790ab7275f512f3cd42925cac03e0a37a00f917ffa3ea66916ccc715862d046 +size 9806560 diff --git a/model/model/layers/14/mlp/up_proj/kernel/2.0 b/model/model/layers/14/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..1f35d754014b2e8480ab1aea6a1000340c848f2e --- /dev/null +++ b/model/model/layers/14/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:295ee12f76f5715a15efe0a8eaea13382402234331d2b53011535ba146106242 +size 9805001 diff --git a/model/model/layers/14/mlp/up_proj/kernel/3.0 b/model/model/layers/14/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..9a9b9186de4399b024c4d3c889685de1f02664b6 --- /dev/null +++ b/model/model/layers/14/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:570d87e22808615c923fb7dba54ba6d68b6d2ffad164c61b48bc1e5d2136abb5 +size 9804388 diff --git a/model/model/layers/14/post_attention_layernorm/kernel/.zarray b/model/model/layers/14/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ 
b/model/model/layers/14/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/14/post_attention_layernorm/kernel/0 b/model/model/layers/14/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..b8e237cc7474842d001cb61fd0eb0837dbb6a72f Binary files /dev/null and b/model/model/layers/14/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/14/self_attn/k_proj/kernel/.zarray b/model/model/layers/14/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/14/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/14/self_attn/k_proj/kernel/0.0 b/model/model/layers/14/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..9746aa90b499a82be466d5f996c02f3cfcc17ff3 --- /dev/null +++ b/model/model/layers/14/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fcec67e17abd28829edf4477b7700f582e8e358e186156ab01ff8d7fbda9edd +size 1232453 diff --git a/model/model/layers/14/self_attn/k_proj/kernel/1.0 b/model/model/layers/14/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..aa3955aeef46f0671cea93157c17c79e53f70c50 --- /dev/null +++ b/model/model/layers/14/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:3aa477094d9f5608fbcdb80c5843e3ddd131823e59a451c083d0fd9602ddebc9 +size 1232426 diff --git a/model/model/layers/14/self_attn/k_proj/kernel/2.0 b/model/model/layers/14/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..c41292937efae01ab3242af0c518d2d31cfdfe3f --- /dev/null +++ b/model/model/layers/14/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d32e717be2249016492dd2326cf59dcfe8c3e58abc2cc832644c8b8e08d36a9e +size 1232503 diff --git a/model/model/layers/14/self_attn/k_proj/kernel/3.0 b/model/model/layers/14/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..d283e0b60f46113ce5a9671950bdf7b99b067efa --- /dev/null +++ b/model/model/layers/14/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2429bba3cde229782b5b9dfa5dad8cef48fe0f7d8077977602316a6028d477c +size 1231920 diff --git a/model/model/layers/14/self_attn/o_proj/kernel/.zarray b/model/model/layers/14/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/14/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/14/self_attn/o_proj/kernel/0.0 b/model/model/layers/14/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..cf742cf773c9074854b4cb17b1b00e23a6184862 --- /dev/null +++ b/model/model/layers/14/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7245dce4d995e4c7bca393693db13e69bc28f573c6e55aaf1ea7ba742ce0b56 +size 3669146 diff --git 
a/model/model/layers/14/self_attn/o_proj/kernel/0.1 b/model/model/layers/14/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..ee36e436b079c3193196751799bcb332d678a656 --- /dev/null +++ b/model/model/layers/14/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d64b8a8598833ca31bad31b68750ff4112cd710a06f3ee6682cc02e2db21477c +size 3670166 diff --git a/model/model/layers/14/self_attn/o_proj/kernel/0.2 b/model/model/layers/14/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..286406219c25cdfe9b2fcbd62cdb42d5e31bc318 --- /dev/null +++ b/model/model/layers/14/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efdc9b6687c0d3e39dd88f8f846e08b2da131bb342700b95c48c76278f8b820d +size 3669382 diff --git a/model/model/layers/14/self_attn/o_proj/kernel/0.3 b/model/model/layers/14/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..f9856c8d3781a55050eeb0ffb1f23f8f41bfc4a3 --- /dev/null +++ b/model/model/layers/14/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:398c974fda463c900e27bcd13d2d578bb56d520e36cc0493c747ccf9a811bdc7 +size 3669008 diff --git a/model/model/layers/14/self_attn/q_proj/kernel/.zarray b/model/model/layers/14/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/14/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/14/self_attn/q_proj/kernel/0.0 b/model/model/layers/14/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..7c61cc90463065f080297cf5beabc59e21d29ef6 --- /dev/null +++ b/model/model/layers/14/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a51496ce74be1c47f30972a8509ae788d91887e27e88f1c02a54298d42e89eb2 +size 3714113 diff --git a/model/model/layers/14/self_attn/q_proj/kernel/1.0 b/model/model/layers/14/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..56e8dab2c8dc41ddfa6a19403e668249379a8d54 --- /dev/null +++ b/model/model/layers/14/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ca3db6256f66e960ecaa3a15361b00dcb0c5941a7fe6a3bb6162de9e28fad09 +size 3713612 diff --git a/model/model/layers/14/self_attn/q_proj/kernel/2.0 b/model/model/layers/14/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..407982135bbe424071e18013575015b5085fda22 --- /dev/null +++ b/model/model/layers/14/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:049fc3b6547b63dca68e5b5d808a2f45eb4f942bd5e694a1853ac11d91aeade3 +size 3713360 diff --git a/model/model/layers/14/self_attn/q_proj/kernel/3.0 b/model/model/layers/14/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..d54a46b40c9fda07fa490252759644d86c9d8685 --- /dev/null +++ b/model/model/layers/14/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ac67d8fadbd0774ad98df8c12b5edfcc066f23967e91a4537d3ab5780844dcc +size 3713578 diff --git a/model/model/layers/14/self_attn/v_proj/kernel/.zarray b/model/model/layers/14/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/14/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/14/self_attn/v_proj/kernel/0.0 b/model/model/layers/14/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a4b3670a55785e0aa660cdaa06a3e64a461f2193 --- /dev/null +++ b/model/model/layers/14/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:552fb9f2b17944711e312a161341cc191f9b4cc2b06886fc39e1d61dfbeb9d4a +size 1226978 diff --git a/model/model/layers/14/self_attn/v_proj/kernel/1.0 b/model/model/layers/14/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..38a558ebc35a91a731b3274d5ce0391a53e4e547 --- /dev/null +++ b/model/model/layers/14/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b7d0e65808e45565add1ba165209221eba52d528b79ff66494e7de5a3898c37 +size 1227580 diff --git a/model/model/layers/14/self_attn/v_proj/kernel/2.0 b/model/model/layers/14/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..0ee0358d1cfff3ad0ca6eb45beea1e3c808801a8 --- /dev/null +++ b/model/model/layers/14/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d42b7dfdbc0e61838cd3e16d726f569c40b05772cfe79b9e7ab8972fce34a33 +size 1227078 diff --git a/model/model/layers/14/self_attn/v_proj/kernel/3.0 b/model/model/layers/14/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..2f268d56e93fb5c79326d00745155d747f441724 --- /dev/null +++ b/model/model/layers/14/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffdcb2b333178ee448739976c159a9c7f12ffc26b997914d8a5ae3023afaecf1 +size 1226600 
diff --git a/model/model/layers/15/input_layernorm/kernel/.zarray b/model/model/layers/15/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/15/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/15/input_layernorm/kernel/0 b/model/model/layers/15/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..b0447732b84a1fd814f88b4d187f97a7da3397d8 Binary files /dev/null and b/model/model/layers/15/input_layernorm/kernel/0 differ diff --git a/model/model/layers/15/mlp/down_proj/kernel/.zarray b/model/model/layers/15/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/15/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/15/mlp/down_proj/kernel/0.0 b/model/model/layers/15/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..3e91303eb0d5735efdd5895a96bcbf97e420d790 --- /dev/null +++ b/model/model/layers/15/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6c3e3243809321ac6fe8781f17ab7e208418f5fda00c5a92f63fe8851112778 +size 9800263 diff --git a/model/model/layers/15/mlp/down_proj/kernel/0.1 b/model/model/layers/15/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..416358d198f494aed60b3dad6932844e75b8ec88 --- /dev/null +++ b/model/model/layers/15/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:826c32f84dc40312148cb4589e9b093b34d470f363b97a42d364819392852d4e +size 9800077 diff --git a/model/model/layers/15/mlp/down_proj/kernel/0.2 b/model/model/layers/15/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..2adc52b7cdfc9a5e73f4db653d818287969d4216 --- /dev/null +++ b/model/model/layers/15/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53fc548ed900cc2d59540b8230f743176a99538924df1a178b45f82ce0f46358 +size 9799884 diff --git a/model/model/layers/15/mlp/down_proj/kernel/0.3 b/model/model/layers/15/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..e5b8f967d3d9de2166035f1a765409f14e17f277 --- /dev/null +++ b/model/model/layers/15/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:644e002ab63085cacd043ab48417c577f5086aec20c4760abb7d515bbee8fe58 +size 9800640 diff --git a/model/model/layers/15/mlp/gate_proj/kernel/.zarray b/model/model/layers/15/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/15/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/15/mlp/gate_proj/kernel/0.0 b/model/model/layers/15/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..04c5799947c7e4cb45a496bda6ff524d5a2cc71e --- /dev/null +++ b/model/model/layers/15/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ebb66d2488c5b802afa97544a2750361c42dd613fa892ac4f371483a5e857bd +size 9814493 diff --git a/model/model/layers/15/mlp/gate_proj/kernel/1.0 b/model/model/layers/15/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..119f90b025d9c82fb2f6d2cebbfb0aa7763dbf72 --- /dev/null +++ b/model/model/layers/15/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35e339c02710e7f05c2e1814d72b2ae6900ac1f5aa3f13d9964bbf3eca1d9480 +size 9815289 diff --git a/model/model/layers/15/mlp/gate_proj/kernel/2.0 b/model/model/layers/15/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..9ceb4d51a8a56101d4f8e5911534d1409141deef --- /dev/null +++ b/model/model/layers/15/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c43e8f40990a167f8a76dab49cea130b4fdd685069cff032c58921517c953d37 +size 9814381 diff --git a/model/model/layers/15/mlp/gate_proj/kernel/3.0 b/model/model/layers/15/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..4c5951fc2fdc2f3bb8d109923e9ad03968c0944c --- /dev/null +++ b/model/model/layers/15/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da6b12880315c150ee381d03bd9659ffed3694046d6554984a4c86020dbec460 +size 9815044 diff --git a/model/model/layers/15/mlp/up_proj/kernel/.zarray b/model/model/layers/15/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/15/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/15/mlp/up_proj/kernel/0.0 b/model/model/layers/15/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..63d6b0507294fc22ebf208e2636dc6c3d157e5b4 --- /dev/null +++ b/model/model/layers/15/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cefec5134674d8f62d0dc4e36578c3b0cbc6ecee9e6b203af712a12d4751de8c +size 9800709 diff --git a/model/model/layers/15/mlp/up_proj/kernel/1.0 b/model/model/layers/15/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..23816deb741209df8e5e3c6011e8b9483fa63dc9 --- /dev/null +++ b/model/model/layers/15/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eed434b775561a45997ba86310b941466e4844272fa9950c8f88678688940d94 +size 9800732 diff --git a/model/model/layers/15/mlp/up_proj/kernel/2.0 b/model/model/layers/15/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..93213230ea169ff43f4b66613de2626ec377b94b --- /dev/null +++ b/model/model/layers/15/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:993621bdf5fac49157506ca3441f8dc2b51b55c7f55e39da92792a192378f361 +size 9799587 diff --git a/model/model/layers/15/mlp/up_proj/kernel/3.0 b/model/model/layers/15/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..bd639bc14843e2f09b72ed6412fc06803f03e702 --- /dev/null +++ b/model/model/layers/15/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dc6e936b1e6ec172641d0cf1670897eec49a4d1deb010e8693b21953d7bf1df +size 9799659 diff --git a/model/model/layers/15/post_attention_layernorm/kernel/.zarray b/model/model/layers/15/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ 
b/model/model/layers/15/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/15/post_attention_layernorm/kernel/0 b/model/model/layers/15/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..7e3654599e09acc52a99140a1281ae126e82f457 Binary files /dev/null and b/model/model/layers/15/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/15/self_attn/k_proj/kernel/.zarray b/model/model/layers/15/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/15/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/15/self_attn/k_proj/kernel/0.0 b/model/model/layers/15/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..472a06f46a604ba49ccf6f9e6ff1321e4442440c --- /dev/null +++ b/model/model/layers/15/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d6c967cc46172a0f607dc66d1166f5984670fa09299b6787c144f19b007ea3a +size 1233720 diff --git a/model/model/layers/15/self_attn/k_proj/kernel/1.0 b/model/model/layers/15/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..781bc9eb7c18213af3136fde97c2101e76aafdf9 --- /dev/null +++ b/model/model/layers/15/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:45192ae1e52c6d188215ef4b9255bddd62b515b92d5fd17355b906df7afb9a58 +size 1233648 diff --git a/model/model/layers/15/self_attn/k_proj/kernel/2.0 b/model/model/layers/15/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..10ed5cef1eba416eb8d0045c0b632790f8689b7a --- /dev/null +++ b/model/model/layers/15/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9b0c6793bd3f567a7212c861a42f50975fe67ed6cc1c8a29f3984e57d608275 +size 1233463 diff --git a/model/model/layers/15/self_attn/k_proj/kernel/3.0 b/model/model/layers/15/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..06f9b1a2f11edb4c7985950ba5557d29ae11c29e --- /dev/null +++ b/model/model/layers/15/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:289646beeaac25a2b36b55654d1ab65ea6024f0045f6826bc253ba2d3be575ac +size 1233470 diff --git a/model/model/layers/15/self_attn/o_proj/kernel/.zarray b/model/model/layers/15/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/15/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/15/self_attn/o_proj/kernel/0.0 b/model/model/layers/15/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..00dbcdbfe146327ce7ecbff37dffccdbe858ad68 --- /dev/null +++ b/model/model/layers/15/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14cba11f2f0b4ce1209439fb77d4831a36623d56d5c9b8e0f315a2be342f9df5 +size 3669224 diff --git 
a/model/model/layers/15/self_attn/o_proj/kernel/0.1 b/model/model/layers/15/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..1731d1da9f6e5bba5b1e4ca9c000f22d65fd966b --- /dev/null +++ b/model/model/layers/15/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e5e672a94f7d837062a3d8d872e5557aea078c3b2012a5718527a7642931ac1 +size 3669268 diff --git a/model/model/layers/15/self_attn/o_proj/kernel/0.2 b/model/model/layers/15/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..15209ee475a5a32ee18feabdc45370e82344c343 --- /dev/null +++ b/model/model/layers/15/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1bf9359305d1b9540d2a509741b3c9b83b6dae5b2ce6c6e47efe0925f019b24 +size 3669121 diff --git a/model/model/layers/15/self_attn/o_proj/kernel/0.3 b/model/model/layers/15/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..2c67c79c3f9a8457363be9f27d29d47a64cd9fdb --- /dev/null +++ b/model/model/layers/15/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34c234b00694d22562052858fff048799f2dfed1f9b4f79fbe7da05e14f82bb8 +size 3668010 diff --git a/model/model/layers/15/self_attn/q_proj/kernel/.zarray b/model/model/layers/15/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/15/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/15/self_attn/q_proj/kernel/0.0 b/model/model/layers/15/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..ed23b236654ae8f20e2057fd49e4ad8bd2722500 --- /dev/null +++ b/model/model/layers/15/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f76f6187d1cfbd92fcf352c479d57346484466350612e834ab69ce4e3e3a665b +size 3706222 diff --git a/model/model/layers/15/self_attn/q_proj/kernel/1.0 b/model/model/layers/15/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..20e8d860339f2951c0ee0434b93426363ecc3bd3 --- /dev/null +++ b/model/model/layers/15/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceed5b789ac8b97875d048f4295586a1fcb46c632e26542bdacf9ce278e9107e +size 3706323 diff --git a/model/model/layers/15/self_attn/q_proj/kernel/2.0 b/model/model/layers/15/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..23ce6688e5c6068a5a138a1aaff0d2b5e136393c --- /dev/null +++ b/model/model/layers/15/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e02ff34a1c8911d3af1d57417d7e51f279c3e99068a773b52e68d78581ca8e9 +size 3706428 diff --git a/model/model/layers/15/self_attn/q_proj/kernel/3.0 b/model/model/layers/15/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..48ac0916ba2e25861ccc669a9351664dae084989 --- /dev/null +++ b/model/model/layers/15/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97538ec48dac772047f4017985aaa25085f5b2f925c9e25986ad8edf6573f52e +size 3705671 diff --git a/model/model/layers/15/self_attn/v_proj/kernel/.zarray b/model/model/layers/15/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/15/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/15/self_attn/v_proj/kernel/0.0 b/model/model/layers/15/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..7f4d5a6448eabb1b4d79b23425121cb81e8d9524 --- /dev/null +++ b/model/model/layers/15/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8742ebe73c9675a50be02da2b8cc1bd07a84a06533752514f858366b6e222918 +size 1224551 diff --git a/model/model/layers/15/self_attn/v_proj/kernel/1.0 b/model/model/layers/15/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..2423d2d1c89d3651b0873a3ce0e768571428104c --- /dev/null +++ b/model/model/layers/15/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fd695895e8ccdb6d1fa2477155545549bd37389547ca5f46cbac33d9e13e035 +size 1224784 diff --git a/model/model/layers/15/self_attn/v_proj/kernel/2.0 b/model/model/layers/15/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..6886064eadeb3781ee76f76e06557cb03cf58254 --- /dev/null +++ b/model/model/layers/15/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e2ac27727b8b2f6e7e28b656c7de573e4022cf3b80da76563437d468196003b +size 1225051 diff --git a/model/model/layers/15/self_attn/v_proj/kernel/3.0 b/model/model/layers/15/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..affb13b1cbf536d2703e91c821d73192ed18edfa --- /dev/null +++ b/model/model/layers/15/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cac7d40efffe0ef8061151d17a12efa9a1f3ad22ef2852489beec393907266e +size 1224021 
diff --git a/model/model/layers/16/input_layernorm/kernel/.zarray b/model/model/layers/16/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/16/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/16/input_layernorm/kernel/0 b/model/model/layers/16/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..5df8f4330eda6cb409695ff6078db5d0af75acbe Binary files /dev/null and b/model/model/layers/16/input_layernorm/kernel/0 differ diff --git a/model/model/layers/16/mlp/down_proj/kernel/.zarray b/model/model/layers/16/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/16/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/16/mlp/down_proj/kernel/0.0 b/model/model/layers/16/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..5bc92b9bc279f684d3f871ae0afd46d95c7ef2bb --- /dev/null +++ b/model/model/layers/16/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f46d41cb929d78ceaf2d5235a8899e8a8b8d20a6533b849716f39fbc6be27d19 +size 9796269 diff --git a/model/model/layers/16/mlp/down_proj/kernel/0.1 b/model/model/layers/16/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..14e4dc0805ef9c8e1bf34011121f44b09e9ba9d6 --- /dev/null +++ b/model/model/layers/16/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:071b00324a73f4a1bffb1d2f549e264bd63859bc5cc08d4b4f7128b304b43697 +size 9796523 diff --git a/model/model/layers/16/mlp/down_proj/kernel/0.2 b/model/model/layers/16/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..ab1684208f3db91e9d462d28ae2259f745a410c0 --- /dev/null +++ b/model/model/layers/16/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1290f6b988c377ab0b44a813bc9b584a7b4bcabdc94e385cd6e95196f602f966 +size 9798021 diff --git a/model/model/layers/16/mlp/down_proj/kernel/0.3 b/model/model/layers/16/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..8088f9dfbc421f169a3ab28a3f6672dcc2eb3a6e --- /dev/null +++ b/model/model/layers/16/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b88c706084b2546391f01fab1fa86d686851109e247fb47a3afdb0ae3eaba44a +size 9796788 diff --git a/model/model/layers/16/mlp/gate_proj/kernel/.zarray b/model/model/layers/16/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/16/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/16/mlp/gate_proj/kernel/0.0 b/model/model/layers/16/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..29a8a3219ff60c0cbc6f4b31d41888506c6c8cac --- /dev/null +++ b/model/model/layers/16/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92b833f16fd512155285a2c869bd7628927cf17d71492dbccb85676562519ebd +size 9813619 diff --git a/model/model/layers/16/mlp/gate_proj/kernel/1.0 b/model/model/layers/16/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..929244e1d9106176e1a516a340e82e1b5f1dd165 --- /dev/null +++ b/model/model/layers/16/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34300a1567c29994d8a216b7823ea9b2da0fbdc2aa93637247897ab00fb0a8ea +size 9813574 diff --git a/model/model/layers/16/mlp/gate_proj/kernel/2.0 b/model/model/layers/16/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..fc961fceb5d020f2f80648c2b60d0da73f09b55a --- /dev/null +++ b/model/model/layers/16/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86a7b1e5e221fdda2c040a3bab6411d535236dbc99b92765a8492111fcae0d26 +size 9813024 diff --git a/model/model/layers/16/mlp/gate_proj/kernel/3.0 b/model/model/layers/16/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..ded67b17c2067c735aff146df44be8a745fb90af --- /dev/null +++ b/model/model/layers/16/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4b37baed0e84ebc0da128fbe5958051ccd2a0e09e487ba81c07e8e490015cf4 +size 9813936 diff --git a/model/model/layers/16/mlp/up_proj/kernel/.zarray b/model/model/layers/16/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/16/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/16/mlp/up_proj/kernel/0.0 b/model/model/layers/16/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..b3afb0752fd233ee6811912d2b0b64acc52f532a --- /dev/null +++ b/model/model/layers/16/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b58cb36356d0f7d281c24dae313569cc3ea21763c31ca83f98b4b5a5aca2a229 +size 9794642 diff --git a/model/model/layers/16/mlp/up_proj/kernel/1.0 b/model/model/layers/16/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..6c42e7c74d7ee7d9480e993386ef076d653c9448 --- /dev/null +++ b/model/model/layers/16/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97426f3534625388c45a4e30893206d6e3bc1d817d7b5b7acd3eeb90f2776d91 +size 9795015 diff --git a/model/model/layers/16/mlp/up_proj/kernel/2.0 b/model/model/layers/16/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..ad9f2a17f779cfec59399ee544d01a73df504077 --- /dev/null +++ b/model/model/layers/16/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19e8e11a72fdd96e8558e356350231a4595a886e1baa7de4d90a9b37c4e3a3b5 +size 9794719 diff --git a/model/model/layers/16/mlp/up_proj/kernel/3.0 b/model/model/layers/16/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..435a439eb1c4c2c581dc9c5da382f4ab84725954 --- /dev/null +++ b/model/model/layers/16/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a63af3066e3159e2d411ca0fa71497849a9e885a51c5122001577611247760b1 +size 9793996 diff --git a/model/model/layers/16/post_attention_layernorm/kernel/.zarray b/model/model/layers/16/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ 
b/model/model/layers/16/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/16/post_attention_layernorm/kernel/0 b/model/model/layers/16/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..53e2fe301625d378e25e215ac79065bd1baaa7bd Binary files /dev/null and b/model/model/layers/16/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/16/self_attn/k_proj/kernel/.zarray b/model/model/layers/16/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/16/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/16/self_attn/k_proj/kernel/0.0 b/model/model/layers/16/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..6cc22d10f1a994adcdbc778dc45181a548144b50 --- /dev/null +++ b/model/model/layers/16/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2c2806ff9afae37d914118cb34cb45bdcfc43afe0852f3d463c9454900a97bd +size 1233669 diff --git a/model/model/layers/16/self_attn/k_proj/kernel/1.0 b/model/model/layers/16/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..d4db8e9f192ba2b2aa2fe9f245c93b803f2d8c5d --- /dev/null +++ b/model/model/layers/16/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:e935db6b74f1a0c48513ff2137571d35db85916dc88b408d11756972196c9bd3 +size 1233634 diff --git a/model/model/layers/16/self_attn/k_proj/kernel/2.0 b/model/model/layers/16/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..a7cc4d314acf11a8a71936952055735ab93c9363 --- /dev/null +++ b/model/model/layers/16/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1dd0820e9de9934ee967866101e4ef5b05aa63b465dabe633441eed05c66add +size 1233483 diff --git a/model/model/layers/16/self_attn/k_proj/kernel/3.0 b/model/model/layers/16/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..0572a8bcc8a366d9406ff2e6307503472c920173 --- /dev/null +++ b/model/model/layers/16/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ddc94af30296c140c84609c7c18ed124e35934a00d94d9831db6ff1f2450f20 +size 1233401 diff --git a/model/model/layers/16/self_attn/o_proj/kernel/.zarray b/model/model/layers/16/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/16/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/16/self_attn/o_proj/kernel/0.0 b/model/model/layers/16/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..3f812788c6642d3285f1b57a38bb7b2831af5dc1 --- /dev/null +++ b/model/model/layers/16/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:263ca7d00bba1f59a8a30c66c3e1ddc7e744efcfa68a51d43f97cd2cfb7a0ee8 +size 3666693 diff --git 
a/model/model/layers/16/self_attn/o_proj/kernel/0.1 b/model/model/layers/16/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..1ab51ffc33799b4551da11c26912207b548ba19f --- /dev/null +++ b/model/model/layers/16/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59f5fa97dba8c1647eac6804d09ef1f8c76f5dd5125dbe3097439bd30a785e77 +size 3666766 diff --git a/model/model/layers/16/self_attn/o_proj/kernel/0.2 b/model/model/layers/16/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..e4aaed01e475617013835e3871af8074e8f112de --- /dev/null +++ b/model/model/layers/16/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1884d29a000887615e8f8ffd0b44199bc4aaa54ff7c191cb861ec912658c403a +size 3666379 diff --git a/model/model/layers/16/self_attn/o_proj/kernel/0.3 b/model/model/layers/16/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..4e6950156d865cfd497ad39dc546b0ff074dbafb --- /dev/null +++ b/model/model/layers/16/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f92832f556564790e41a2db33687039b8c988a83dfcb7229ee6b58c3e1302860 +size 3666362 diff --git a/model/model/layers/16/self_attn/q_proj/kernel/.zarray b/model/model/layers/16/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/16/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/16/self_attn/q_proj/kernel/0.0 b/model/model/layers/16/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..b2040fc93b4fefd2f6770da4c710e51594fe48b9 --- /dev/null +++ b/model/model/layers/16/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fd3ab47a893d8095e606e895b070851ba122e9bf79c0cd655c2a26028750376 +size 3701034 diff --git a/model/model/layers/16/self_attn/q_proj/kernel/1.0 b/model/model/layers/16/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..dbfecbf1c9fc47cec21ceda378479e8b82ad5c24 --- /dev/null +++ b/model/model/layers/16/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:647105d32df687a134f0d3fdf866dccd8644266b2457722c7647a90c64e0c2af +size 3700657 diff --git a/model/model/layers/16/self_attn/q_proj/kernel/2.0 b/model/model/layers/16/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..808cf2e6bec5532995740f63b6d06fb63ac8a003 --- /dev/null +++ b/model/model/layers/16/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b938c7554b973061302efa43de712e0f0ec2fd8e91f80f8c10b9ff9bd56d0709 +size 3700533 diff --git a/model/model/layers/16/self_attn/q_proj/kernel/3.0 b/model/model/layers/16/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..4d711d2e000b4ff651ea0bcece37406ac57edd76 --- /dev/null +++ b/model/model/layers/16/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:322d2cb2f229a60855bb7f903350417120be310515fb4272369b692e424f9450 +size 3700140 diff --git a/model/model/layers/16/self_attn/v_proj/kernel/.zarray b/model/model/layers/16/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/16/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/16/self_attn/v_proj/kernel/0.0 b/model/model/layers/16/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..788184626b80ba5ece42c40332e5755e1a686a64 --- /dev/null +++ b/model/model/layers/16/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27a319991088ca0cf83d36c0569dceb0c6787d002f9e4c22d42a1ac5ce6efd0b +size 1226393 diff --git a/model/model/layers/16/self_attn/v_proj/kernel/1.0 b/model/model/layers/16/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..7cd8e868eee76a5aefb658e75a734c1e777a9452 --- /dev/null +++ b/model/model/layers/16/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acf98d5c9cee42f76084be44e3c9c34ddf23989179526a4d034d41ffdfcde3e4 +size 1226617 diff --git a/model/model/layers/16/self_attn/v_proj/kernel/2.0 b/model/model/layers/16/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..97167f79debb189847f45e1d10a2be3cecf660c3 --- /dev/null +++ b/model/model/layers/16/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc582257c8ba6ef366aeaf2a933fc8ead4069520b7125ebd007a3fea03c172fa +size 1226621 diff --git a/model/model/layers/16/self_attn/v_proj/kernel/3.0 b/model/model/layers/16/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..50bc16431291d47ee2e7a24fff1278c6a257c6b6 --- /dev/null +++ b/model/model/layers/16/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3306250935073c8e887541a01561a81da36d29f30de0f94386dfb3f4e54e05ea +size 1226079 
diff --git a/model/model/layers/17/input_layernorm/kernel/.zarray b/model/model/layers/17/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/17/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/17/input_layernorm/kernel/0 b/model/model/layers/17/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..3ccd30812800fdcbbe4c5ee0178b9bb32d5779f6 Binary files /dev/null and b/model/model/layers/17/input_layernorm/kernel/0 differ diff --git a/model/model/layers/17/mlp/down_proj/kernel/.zarray b/model/model/layers/17/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/17/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/17/mlp/down_proj/kernel/0.0 b/model/model/layers/17/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..d74ad3afd69f5ff6d4cad566f637eea4e5bbe7e1 --- /dev/null +++ b/model/model/layers/17/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b87f5807b8939b256a55340e2e8e21d8fef7c447a07b1f4b41355334bf42542 +size 9796125 diff --git a/model/model/layers/17/mlp/down_proj/kernel/0.1 b/model/model/layers/17/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..558cd73c6820b1e3c9fe30426a1f431222347c84 --- /dev/null +++ b/model/model/layers/17/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25db66459029919d9fddb8d866b07ec5c0bd950fec864e91729589387a6a938d +size 9796109 diff --git a/model/model/layers/17/mlp/down_proj/kernel/0.2 b/model/model/layers/17/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..41ccdd9a8e7e24298ed4cc6e251a83cdae2b26b3 --- /dev/null +++ b/model/model/layers/17/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b62b505406b35c62328e8031792a58641abc66880134da2f67292eb71f69673 +size 9795731 diff --git a/model/model/layers/17/mlp/down_proj/kernel/0.3 b/model/model/layers/17/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..e9631a2663e983511d6275b43ec3b06de5d2485b --- /dev/null +++ b/model/model/layers/17/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d334a24decc84c218eec0a71efd70b6bc547d1aa0471235aacfbb1bae883e68 +size 9796214 diff --git a/model/model/layers/17/mlp/gate_proj/kernel/.zarray b/model/model/layers/17/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/17/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/17/mlp/gate_proj/kernel/0.0 b/model/model/layers/17/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..033ff757c410a86926270d7f98a5c1736bc62443 --- /dev/null +++ b/model/model/layers/17/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d77822152db4a9ab800347bf119a73cc20c73286a3c63eac7d895a02d63bcda9 +size 9813584 diff --git a/model/model/layers/17/mlp/gate_proj/kernel/1.0 b/model/model/layers/17/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..00a8435ed9279b972daa162fb2645610bb7bd292 --- /dev/null +++ b/model/model/layers/17/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77315352f2abd0bf30bdec422107de2cf74e1319b6432dda6db0afdfa2e6f83e +size 9813550 diff --git a/model/model/layers/17/mlp/gate_proj/kernel/2.0 b/model/model/layers/17/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..1845a9ec10de4037a26435544d6873c3cf833fdf --- /dev/null +++ b/model/model/layers/17/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b824dce05c5d6c5094ae308632dfd71910c41dce384ee94cd05b607ceb2de2e +size 9812638 diff --git a/model/model/layers/17/mlp/gate_proj/kernel/3.0 b/model/model/layers/17/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..d00f99d9cbadc1dac6236a7a68e4c2b22a833190 --- /dev/null +++ b/model/model/layers/17/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61b0ad42c742b3edcee9ee4530d00b9216116e1251b8b22e21ea7af0351d960c +size 9813864 diff --git a/model/model/layers/17/mlp/up_proj/kernel/.zarray b/model/model/layers/17/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/17/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/17/mlp/up_proj/kernel/0.0 b/model/model/layers/17/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..930575767fe6899078e2c4b0865f85f5524745ca --- /dev/null +++ b/model/model/layers/17/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21d31621cf4e92fdf4f921d7931048e0aa93ac9fb62347be1f7836a51df53971 +size 9793422 diff --git a/model/model/layers/17/mlp/up_proj/kernel/1.0 b/model/model/layers/17/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..75dfc80719dff014b20d18c6feaa7ccdce1f5d69 --- /dev/null +++ b/model/model/layers/17/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb3b3fe0d71e51dfd080cb0651e60fd3d85a8ece1906b8ebcc3d700f5792cdf9 +size 9793415 diff --git a/model/model/layers/17/mlp/up_proj/kernel/2.0 b/model/model/layers/17/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..67b41912afbb88c4df2eee20c8df10cd38bc5e85 --- /dev/null +++ b/model/model/layers/17/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1286469ad79dae9eae5a587ddf902cf29fbd9c84589d860942b8d27862dd9e5e +size 9792027 diff --git a/model/model/layers/17/mlp/up_proj/kernel/3.0 b/model/model/layers/17/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..94d36f14789f643849c8015305bdde3cf17ea10d --- /dev/null +++ b/model/model/layers/17/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4bf42e6ef74fe6905c0187fd9bbe260cab4e964b7fe3c88b0958ed03c992021 +size 9792309 diff --git a/model/model/layers/17/post_attention_layernorm/kernel/.zarray b/model/model/layers/17/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ 
b/model/model/layers/17/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/17/post_attention_layernorm/kernel/0 b/model/model/layers/17/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..3cced37a357ef00f51ab88a6192f8bef25e7490b Binary files /dev/null and b/model/model/layers/17/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/17/self_attn/k_proj/kernel/.zarray b/model/model/layers/17/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/17/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/17/self_attn/k_proj/kernel/0.0 b/model/model/layers/17/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..44079e877eedbab0fb2125056c0b471a47104647 --- /dev/null +++ b/model/model/layers/17/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aa057c9a3a514ffe5c2cc440310cdbc7d70eb4f7dd34644f10466ec6849a4f4 +size 1232507 diff --git a/model/model/layers/17/self_attn/k_proj/kernel/1.0 b/model/model/layers/17/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..d95d67c6f5b74b74317054caab181d81c0940cdc --- /dev/null +++ b/model/model/layers/17/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:c34e065f899b1068b4142ad67a362eed0959169d6e24aa4e075f65260092f9a9 +size 1232733 diff --git a/model/model/layers/17/self_attn/k_proj/kernel/2.0 b/model/model/layers/17/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..9feda9dd61f850f45b37eb278e99f4947d38f873 --- /dev/null +++ b/model/model/layers/17/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ff4c6bedaee49b145c43109d165288f52e72fd1a9a7cebe4d0313de12217e5d +size 1232839 diff --git a/model/model/layers/17/self_attn/k_proj/kernel/3.0 b/model/model/layers/17/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..a7c4cc05e4c74dfeb7f4c8dd72bde46c94c1f430 --- /dev/null +++ b/model/model/layers/17/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88950297def1ccc968086b5af4588e8f0634e283bbc258b415cfe5065a54eecf +size 1232726 diff --git a/model/model/layers/17/self_attn/o_proj/kernel/.zarray b/model/model/layers/17/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/17/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/17/self_attn/o_proj/kernel/0.0 b/model/model/layers/17/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a158c375158c5f2b292992db9b6bea96ecfd33b7 --- /dev/null +++ b/model/model/layers/17/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:127c3e24369b576aa519dadea85e74c73d8b6211c5dbce8185650567e454a164 +size 3668367 diff --git 
a/model/model/layers/17/self_attn/o_proj/kernel/0.1 b/model/model/layers/17/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..dc55ea56636933d35183dbb96d59930700d73d24 --- /dev/null +++ b/model/model/layers/17/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bae7518c861f7076c679f8f0ead5de518b2d13efae3868c2c8d9d1e193209f29 +size 3667937 diff --git a/model/model/layers/17/self_attn/o_proj/kernel/0.2 b/model/model/layers/17/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..01a7d88e8692a82ea592fd43b916aa3eeaaf810b --- /dev/null +++ b/model/model/layers/17/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a31484e4564e7672411e994672f267e7da7b7bcf3a0af9d8d2f9079e55b682de +size 3668314 diff --git a/model/model/layers/17/self_attn/o_proj/kernel/0.3 b/model/model/layers/17/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..ec9aa494c0356e4b007db693c6bd774acc24a99f --- /dev/null +++ b/model/model/layers/17/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:777276cfd140984b09d45f2c6af9138320956a8647dea68bf970f662ac5f4d77 +size 3667590 diff --git a/model/model/layers/17/self_attn/q_proj/kernel/.zarray b/model/model/layers/17/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/17/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/17/self_attn/q_proj/kernel/0.0 b/model/model/layers/17/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..a60a381b3c44b9583845840f691455faa0c9d145 --- /dev/null +++ b/model/model/layers/17/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d170b4e7036aee6e32d3a0a7fa321777459df97ddaf94119ee4641fae665117c +size 3700996 diff --git a/model/model/layers/17/self_attn/q_proj/kernel/1.0 b/model/model/layers/17/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..8b22f275bc15fd05b9636c11d39c96c40c9fe7da --- /dev/null +++ b/model/model/layers/17/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67a685d48792896a4d1bd9a19860550184adb734a835d87340ae427d4ba227ea +size 3701009 diff --git a/model/model/layers/17/self_attn/q_proj/kernel/2.0 b/model/model/layers/17/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..0629140ea9448986d453d111b9dd8223eaea8af5 --- /dev/null +++ b/model/model/layers/17/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:857221a58e998b20f4b3a2fa02292833f5a4ff054b5da4b7ead1bd298ffc4c36 +size 3701063 diff --git a/model/model/layers/17/self_attn/q_proj/kernel/3.0 b/model/model/layers/17/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..8975feb80f195dc13bd1c703b6bddf21d653ed1c --- /dev/null +++ b/model/model/layers/17/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e19e9bbb73bdb975e63685b5d30d0b7475bab953cae18a2c5fc4c50b0e4d761 +size 3700625 diff --git a/model/model/layers/17/self_attn/v_proj/kernel/.zarray b/model/model/layers/17/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/17/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/17/self_attn/v_proj/kernel/0.0 b/model/model/layers/17/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..15bea576c18f383b8c4de3219d1f3c8bdab50278 --- /dev/null +++ b/model/model/layers/17/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aee1dc72d472c5cf0c0988f1c80e51fb546589c1c064b78d3b17a593a2557d90 +size 1226600 diff --git a/model/model/layers/17/self_attn/v_proj/kernel/1.0 b/model/model/layers/17/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..adb32a0f5bd743bad6878f6a8fd03f3a97f2cedf --- /dev/null +++ b/model/model/layers/17/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66bb56c2afa228cadb7ce41c50f224bea7284de3b262e70d39128263431dd571 +size 1226578 diff --git a/model/model/layers/17/self_attn/v_proj/kernel/2.0 b/model/model/layers/17/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..71d3bb79d4e9ce01f3060a252c0e77c621341040 --- /dev/null +++ b/model/model/layers/17/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5608ed288f8c29f2d4abfcdde1ddd71da6dba695cc687dc9842714e9040ec6f +size 1226453 diff --git a/model/model/layers/17/self_attn/v_proj/kernel/3.0 b/model/model/layers/17/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..3cf96774ff776945b1e6cc7811798f6d5dff8bf0 --- /dev/null +++ b/model/model/layers/17/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1afdb1b5b834af97fb0d6b2ac7286b7f954583e106709c699902c1e3cd8f9a6e +size 1226256 
diff --git a/model/model/layers/18/input_layernorm/kernel/.zarray b/model/model/layers/18/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/18/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/18/input_layernorm/kernel/0 b/model/model/layers/18/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..91dc3f77efda596fd0444c01bb919bf68c4c2640 Binary files /dev/null and b/model/model/layers/18/input_layernorm/kernel/0 differ diff --git a/model/model/layers/18/mlp/down_proj/kernel/.zarray b/model/model/layers/18/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/18/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/18/mlp/down_proj/kernel/0.0 b/model/model/layers/18/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a35ded36a125d15ad73c935ac05c296d6f34b784 --- /dev/null +++ b/model/model/layers/18/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d05dbdff3f2b2f43fb3c7d65ffa411836fd1a8106eb7546f36cdb9261fda901f +size 9795861 diff --git a/model/model/layers/18/mlp/down_proj/kernel/0.1 b/model/model/layers/18/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..f09fa34aad0ec44e754cc850fd21ec4550291639 --- /dev/null +++ b/model/model/layers/18/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c0419230ebafa75650718f28d037bbbd7e870e93e5daabcea467e4893a47c9d +size 9796432 diff --git a/model/model/layers/18/mlp/down_proj/kernel/0.2 b/model/model/layers/18/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..a5bf98514c18c630e0082e1d182fbe2d84e32517 --- /dev/null +++ b/model/model/layers/18/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96416c0d2bb30cb17643929b60f52e5af4e794d50345a23d138d2e06260b958c +size 9796194 diff --git a/model/model/layers/18/mlp/down_proj/kernel/0.3 b/model/model/layers/18/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..019a3f1700029d057ce859f4c84e21b8e2836c2d --- /dev/null +++ b/model/model/layers/18/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86307137035275c0d0e09f1b1de772f93fac3b5250ffbbe13062286c3f80756f +size 9796017 diff --git a/model/model/layers/18/mlp/gate_proj/kernel/.zarray b/model/model/layers/18/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/18/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/18/mlp/gate_proj/kernel/0.0 b/model/model/layers/18/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8aa94321584508279fec806bf00ef9701041332a --- /dev/null +++ b/model/model/layers/18/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6760749b8ef4ea5fa68c11dafa6f4d2d0ab935356ef20f90781a79b384e85338 +size 9812358 diff --git a/model/model/layers/18/mlp/gate_proj/kernel/1.0 b/model/model/layers/18/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..e0a6d67e2967d393aa11982d9f94e0b75b0056ee --- /dev/null +++ b/model/model/layers/18/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f31f67810ccd9fbe438f08d600118e254527600560d3f32bdfcf71c1c03133ca +size 9812609 diff --git a/model/model/layers/18/mlp/gate_proj/kernel/2.0 b/model/model/layers/18/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..897767f208d24b009645c2d477ea5b6b05509112 --- /dev/null +++ b/model/model/layers/18/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e310cb3450b9a1c49ae7b8fb7787119a541bd6206bbe66645203ea572d0828f8 +size 9811722 diff --git a/model/model/layers/18/mlp/gate_proj/kernel/3.0 b/model/model/layers/18/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..9dd07bec109093c3d1ea14cea3191572919c3454 --- /dev/null +++ b/model/model/layers/18/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcee1cafa3aa5ccaa8ddf562cc1953bf5ab6fd8bca0fb6aba8c13596ca4119e4 +size 9812360 diff --git a/model/model/layers/18/mlp/up_proj/kernel/.zarray b/model/model/layers/18/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/18/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/18/mlp/up_proj/kernel/0.0 b/model/model/layers/18/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..4c7d90036cd68f964537c6110fb608ffbd1f5089 --- /dev/null +++ b/model/model/layers/18/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be226e7c5c1194dd7a1ded7a2058f73659d89267b2add890aeaf938f0b39b1d4 +size 9792749 diff --git a/model/model/layers/18/mlp/up_proj/kernel/1.0 b/model/model/layers/18/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..a332ff8a0ac6ed0522fcad87e83eb90d5d548b3f --- /dev/null +++ b/model/model/layers/18/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2502713a92eb647c6aa1151f9b2091a314068751323003e6769ff70ae07dd85a +size 9792669 diff --git a/model/model/layers/18/mlp/up_proj/kernel/2.0 b/model/model/layers/18/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..ca3c9e787a9685223fba3e36236eab61cbb11d05 --- /dev/null +++ b/model/model/layers/18/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3407097bae1535a734e9699e3f0c925f2c350508128145bc918dc80941e8fb4 +size 9792664 diff --git a/model/model/layers/18/mlp/up_proj/kernel/3.0 b/model/model/layers/18/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..77255d0e7c044e8768c00ffa09d261b578ed0ba9 --- /dev/null +++ b/model/model/layers/18/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2143beaa095976d1fcff5a28aba23884a37baff33ffef9565e775dfa2622d336 +size 9791039 diff --git a/model/model/layers/18/post_attention_layernorm/kernel/.zarray b/model/model/layers/18/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ 
b/model/model/layers/18/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/18/post_attention_layernorm/kernel/0 b/model/model/layers/18/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..e5826ed41566087aa661d3c359b122878c157fe7 Binary files /dev/null and b/model/model/layers/18/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/18/self_attn/k_proj/kernel/.zarray b/model/model/layers/18/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/18/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/18/self_attn/k_proj/kernel/0.0 b/model/model/layers/18/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..399614b39193e55796218fa174de4ba104fc5b6d --- /dev/null +++ b/model/model/layers/18/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39343716c2b2a77ec3d0ed426293ba836b928b18c5ea044009f8b51791e7463b +size 1233566 diff --git a/model/model/layers/18/self_attn/k_proj/kernel/1.0 b/model/model/layers/18/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..0bf5acb811e5c43a03122621deffdc372f0bc0bb --- /dev/null +++ b/model/model/layers/18/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:82bbb614e988130b5fe17ce1f4c43e06ea51bdb468d21949a0afcabf1dc48b1f +size 1233490 diff --git a/model/model/layers/18/self_attn/k_proj/kernel/2.0 b/model/model/layers/18/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..b775c31c0ea3e43728cdf31aa4d62fbcf3cc4a3a --- /dev/null +++ b/model/model/layers/18/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ffc7de88f691044468e3fcef72e92d55fd5f1624352d70c925e3242f6e79a1a +size 1233664 diff --git a/model/model/layers/18/self_attn/k_proj/kernel/3.0 b/model/model/layers/18/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..920dd5731e22d2d62589e5c9d30cd63c29b80dd0 --- /dev/null +++ b/model/model/layers/18/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12a5d92f64f57de5cf752071bef93b211bf1c526dc1d866ab83c5996c5aa208f +size 1233659 diff --git a/model/model/layers/18/self_attn/o_proj/kernel/.zarray b/model/model/layers/18/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/18/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/18/self_attn/o_proj/kernel/0.0 b/model/model/layers/18/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..452a6bbf430787a98c70427051a4a60f33e90f0e --- /dev/null +++ b/model/model/layers/18/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25240f04056d48d7276b5893040334a7e1e97f48035667cb7706524311bd58d0 +size 3666830 diff --git 
a/model/model/layers/18/self_attn/o_proj/kernel/0.1 b/model/model/layers/18/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..29c85c8ad3d6d657bec3813779836863250eafd9 --- /dev/null +++ b/model/model/layers/18/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa2efc568b2474ed830c4d2c0f4c95d0a63b1a34f3c4670e352ef28c88779eff +size 3667519 diff --git a/model/model/layers/18/self_attn/o_proj/kernel/0.2 b/model/model/layers/18/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..d4bb53a8aed8fec995680b604ed07c07bc70a3cc --- /dev/null +++ b/model/model/layers/18/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90332e06f386871d786a805541210f15b075dd417d4bf6f7723ecda22fca6149 +size 3667118 diff --git a/model/model/layers/18/self_attn/o_proj/kernel/0.3 b/model/model/layers/18/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..5e22bd94a64865255987338c312e104ceed5fb5b --- /dev/null +++ b/model/model/layers/18/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90bbdc72141b03d3af3a3858ac3d3eb08acd16ee857bfd4678beb3de6aae1acf +size 3666605 diff --git a/model/model/layers/18/self_attn/q_proj/kernel/.zarray b/model/model/layers/18/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/18/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/18/self_attn/q_proj/kernel/0.0 b/model/model/layers/18/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..ff0dc87409b41d7af0ef2574afe278ca71b5e801 --- /dev/null +++ b/model/model/layers/18/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51ecce5f7f69804555501dc9fa9fa550b50da6879295d65252f3d748179a0a39 +size 3704168 diff --git a/model/model/layers/18/self_attn/q_proj/kernel/1.0 b/model/model/layers/18/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..7b94df7bcb613a063f984c36154809f92965dc76 --- /dev/null +++ b/model/model/layers/18/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfd242c3c615825527a99ffd865704dd350c847eb9c6141b1fcaac1532baeca8 +size 3705237 diff --git a/model/model/layers/18/self_attn/q_proj/kernel/2.0 b/model/model/layers/18/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..8c937442ab19b50fc6eccc076010d801a4df424e --- /dev/null +++ b/model/model/layers/18/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6093c2144470d3087524b0669ea5c69227ca9bb3247c6e4d00b7aee4efe1213 +size 3705017 diff --git a/model/model/layers/18/self_attn/q_proj/kernel/3.0 b/model/model/layers/18/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..48b35a037a0b4a4b599cdd9a523403c294f46254 --- /dev/null +++ b/model/model/layers/18/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9254176a31c32ab6f1a1b384e5b46eeb9415a049e1ff4294ad3c0d297a6e946f +size 3704820 diff --git a/model/model/layers/18/self_attn/v_proj/kernel/.zarray b/model/model/layers/18/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/18/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/18/self_attn/v_proj/kernel/0.0 b/model/model/layers/18/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a9889922cd6bf0602125b110d873c9e331d2fd46 --- /dev/null +++ b/model/model/layers/18/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3fec7e810ffcb83164176647b866e6684fb35a387caef73b8ea46478b80f3d5 +size 1226920 diff --git a/model/model/layers/18/self_attn/v_proj/kernel/1.0 b/model/model/layers/18/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..d705e89c78c3d588d25a2ffc9615402a73fe75ca --- /dev/null +++ b/model/model/layers/18/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e734a956c91725a9581365a7110a566a421c59f4718a514ef88930b3df9fd0d5 +size 1227644 diff --git a/model/model/layers/18/self_attn/v_proj/kernel/2.0 b/model/model/layers/18/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..cb677a785eac6537b6425b0f61379e6ee063b1be --- /dev/null +++ b/model/model/layers/18/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0395980732deb4194ebb91d2400832dffeb01a7072fed2e69e46a7eeeb46c9a9 +size 1226931 diff --git a/model/model/layers/18/self_attn/v_proj/kernel/3.0 b/model/model/layers/18/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..a4ad786a84e19a85748b038dac1833de55c8ca18 --- /dev/null +++ b/model/model/layers/18/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86c498c6bf135df50d017c9c004c66a33cc02e6d7d78199c6fc4947fdf97a4f4 +size 1226827 
diff --git a/model/model/layers/19/input_layernorm/kernel/.zarray b/model/model/layers/19/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/19/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/19/input_layernorm/kernel/0 b/model/model/layers/19/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..4e08b986f584eda3788fb23039a677cc9ece91ba Binary files /dev/null and b/model/model/layers/19/input_layernorm/kernel/0 differ diff --git a/model/model/layers/19/mlp/down_proj/kernel/.zarray b/model/model/layers/19/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/19/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/19/mlp/down_proj/kernel/0.0 b/model/model/layers/19/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..2853635dc5966eda93a21f132918b400513c03ce --- /dev/null +++ b/model/model/layers/19/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf796f43c354f39e9d15869918a198088fd35a4ed7dd53e2d295a54fef739839 +size 9797985 diff --git a/model/model/layers/19/mlp/down_proj/kernel/0.1 b/model/model/layers/19/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..fbec035163ab463f624f9b924e2837f2ae0aec8f --- /dev/null +++ b/model/model/layers/19/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ddcd6f10886b446406e79de1d2cf91e523a0cc850b9d35941d34be0097533c0 +size 9798201 diff --git a/model/model/layers/19/mlp/down_proj/kernel/0.2 b/model/model/layers/19/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..c306cb8770ad53435748fcb3ca856e108aecad87 --- /dev/null +++ b/model/model/layers/19/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3be2066efb0345981de0b1a3d6f134273cb525224b773e26fa2b5c887994571 +size 9798314 diff --git a/model/model/layers/19/mlp/down_proj/kernel/0.3 b/model/model/layers/19/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..a56b919cbf747594d7f0051701deeedfe1fc2a5a --- /dev/null +++ b/model/model/layers/19/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a569c50a85fe16a02a413a82db629bbb0f0b57baa738630f67bbfcb7a069af9a +size 9797470 diff --git a/model/model/layers/19/mlp/gate_proj/kernel/.zarray b/model/model/layers/19/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/19/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/19/mlp/gate_proj/kernel/0.0 b/model/model/layers/19/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..684125e3272f35a7466850443bc171d32d1da8f6 --- /dev/null +++ b/model/model/layers/19/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e80cbc5d68119a3b9fb52149695a6eb44f6b451fc33fc368637a8c093434a9eb +size 9812380 diff --git a/model/model/layers/19/mlp/gate_proj/kernel/1.0 b/model/model/layers/19/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..c3f77117f4c5608e783668201b48907678b944d9 --- /dev/null +++ b/model/model/layers/19/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29eb84c3579c69c62e079b4bc7b4b4393c8298445b57d47b4441b39dc1f2481c +size 9810922 diff --git a/model/model/layers/19/mlp/gate_proj/kernel/2.0 b/model/model/layers/19/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..68ae2a3b5cbfb72139a0ae62192d3a3d39c49c47 --- /dev/null +++ b/model/model/layers/19/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:866728c1c3f60e5db3c0cdbd1e80b428e98315f7d4f1b862f198a5b4a95e78dd +size 9812288 diff --git a/model/model/layers/19/mlp/gate_proj/kernel/3.0 b/model/model/layers/19/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..c1ecf661edff395585b8252396e6c765224bd308 --- /dev/null +++ b/model/model/layers/19/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eb31337118d00fafa80ab9541fb3ccc39abf4918f360ac27fd474c2de5c0bf6 +size 9812412 diff --git a/model/model/layers/19/mlp/up_proj/kernel/.zarray b/model/model/layers/19/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/19/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/19/mlp/up_proj/kernel/0.0 b/model/model/layers/19/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e2a859f7bea386d9306556712aa11c280b62431a --- /dev/null +++ b/model/model/layers/19/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b8d2c84baf7b74275e7776bcc702b0478897c0b46caffd73de7e695100c6494 +size 9792968 diff --git a/model/model/layers/19/mlp/up_proj/kernel/1.0 b/model/model/layers/19/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..250b2538045160ce7e9bd918dfe92ef6db8ec061 --- /dev/null +++ b/model/model/layers/19/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5de8048ccccc2e2eadc6d0296983d5d2749e1a76214a27d00d36a7e0b601d5a7 +size 9792908 diff --git a/model/model/layers/19/mlp/up_proj/kernel/2.0 b/model/model/layers/19/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..834c92233f4a5f3ae41030aff5fc09bb849fa774 --- /dev/null +++ b/model/model/layers/19/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c79bc6a8ce310ab3b6b35e945b4ec6d200199599489b550812d887c174ae18d +size 9792767 diff --git a/model/model/layers/19/mlp/up_proj/kernel/3.0 b/model/model/layers/19/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..8f627c662068e3bd8c056b7b58e50dd257668a4a --- /dev/null +++ b/model/model/layers/19/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f502868ceb82ce711752657b418f6639df3f797b97c4b5d2cea0ae4cbd414456 +size 9791456 diff --git a/model/model/layers/19/post_attention_layernorm/kernel/.zarray b/model/model/layers/19/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ 
b/model/model/layers/19/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/19/post_attention_layernorm/kernel/0 b/model/model/layers/19/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..f25b4d801bb32e699834dc980e0f8ead07bd0043 Binary files /dev/null and b/model/model/layers/19/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/19/self_attn/k_proj/kernel/.zarray b/model/model/layers/19/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/19/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/19/self_attn/k_proj/kernel/0.0 b/model/model/layers/19/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..bf5f972a0f1c069363803eb3ec4deaa101d637b6 --- /dev/null +++ b/model/model/layers/19/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9131b4e948664474dec0a71724743a96a7ca87c7073640bf4b529e5b84f185fe +size 1231927 diff --git a/model/model/layers/19/self_attn/k_proj/kernel/1.0 b/model/model/layers/19/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..1ea9e54fd050dde031618f2838d2d7d4652b948d --- /dev/null +++ b/model/model/layers/19/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:db57fee1febdb16e139c65981f56703fc3d63d7f92c70cc7197a3252a6fa8a41 +size 1232146 diff --git a/model/model/layers/19/self_attn/k_proj/kernel/2.0 b/model/model/layers/19/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..fc82d14aa371cab15dc9c0d6d774d8b2dd566a29 --- /dev/null +++ b/model/model/layers/19/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f16909264e1dfe4c2e79214c3f4b2e85f47ff1e5c922466cf303ed395f637273 +size 1231986 diff --git a/model/model/layers/19/self_attn/k_proj/kernel/3.0 b/model/model/layers/19/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6565d846fb3af10a6ddf8948d5602d8e0164c5db --- /dev/null +++ b/model/model/layers/19/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e7e359bd1052fdfdb38e66997736a21a85af52bae694c63ee049a12a5d73538 +size 1231323 diff --git a/model/model/layers/19/self_attn/o_proj/kernel/.zarray b/model/model/layers/19/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/19/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/19/self_attn/o_proj/kernel/0.0 b/model/model/layers/19/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e4d90ae99019309ab3ff2c713d4729f8e413405c --- /dev/null +++ b/model/model/layers/19/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c1662aabb077fae7c981427441f1c5150245711c21a56f318ffec1d13fddc6 +size 3669529 diff --git 
a/model/model/layers/19/self_attn/o_proj/kernel/0.1 b/model/model/layers/19/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..add96dda129171ed12d275fd8ab57c07932040a3 --- /dev/null +++ b/model/model/layers/19/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ce44ba60f671c27cd4df4bf1f249ea558a1f1e3a0e8700b9ede39f3f704d1ef +size 3669696 diff --git a/model/model/layers/19/self_attn/o_proj/kernel/0.2 b/model/model/layers/19/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..21a25f5bedfde1377f92b7ce2997f230cc79c22e --- /dev/null +++ b/model/model/layers/19/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20c2035283de6b357d3ee62d461246745596caf0b1b872c8e40aa29a7b75493d +size 3669984 diff --git a/model/model/layers/19/self_attn/o_proj/kernel/0.3 b/model/model/layers/19/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..262d9c1c7e908dfc644854438613bfa7f41ba16c --- /dev/null +++ b/model/model/layers/19/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb4b12566b78ddb8f26683b767dede968dd9f149e9aa14acfa6fca55fe4dc92 +size 3669688 diff --git a/model/model/layers/19/self_attn/q_proj/kernel/.zarray b/model/model/layers/19/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/19/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/19/self_attn/q_proj/kernel/0.0 b/model/model/layers/19/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..518102cdaa9cc524e43bbc7662a7102369cfd3a4 --- /dev/null +++ b/model/model/layers/19/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1777dc01aefc1a722622b78c2aa3f542abf2ea1ec674b610346ad8fb10ad5310 +size 3698412 diff --git a/model/model/layers/19/self_attn/q_proj/kernel/1.0 b/model/model/layers/19/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..ef43027030058f0782446b4f450f4084b0098222 --- /dev/null +++ b/model/model/layers/19/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:530a8f08859f4a746cb79861f1c22e02e22cb6d7274e4842fa220f5754ee1465 +size 3698568 diff --git a/model/model/layers/19/self_attn/q_proj/kernel/2.0 b/model/model/layers/19/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..b2e8f513572b79e50303f1003294e629aa988387 --- /dev/null +++ b/model/model/layers/19/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72d91bf331757b296bf288275e3163ffbe126d31a82658659933ea5df8f53bde +size 3698645 diff --git a/model/model/layers/19/self_attn/q_proj/kernel/3.0 b/model/model/layers/19/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..1f1a80b6e41aa56b33f1e7718a2484680dd0e4bf --- /dev/null +++ b/model/model/layers/19/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59de9d372cb71d3278ed791927514e49f37f4f91ff3f9c4b8a14c92da414ec93 +size 3698496 diff --git a/model/model/layers/19/self_attn/v_proj/kernel/.zarray b/model/model/layers/19/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/19/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/19/self_attn/v_proj/kernel/0.0 b/model/model/layers/19/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..9e3c92886cef113824691b7e70163072f60fe781 --- /dev/null +++ b/model/model/layers/19/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85ccf4be88f371a1e6a01a0aaafb5eae131c76c20a7be8f06db896a6efd6b0b9 +size 1225699 diff --git a/model/model/layers/19/self_attn/v_proj/kernel/1.0 b/model/model/layers/19/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..fa81fd7117f5191395d68395bc1dddb8049db170 --- /dev/null +++ b/model/model/layers/19/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d11f713a46457b93b4db00bbc69ed90d1dcaae123d83a573f711ce3a2e216feb +size 1225676 diff --git a/model/model/layers/19/self_attn/v_proj/kernel/2.0 b/model/model/layers/19/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..06e7e1815fb4a7b92b2a5b238e3c94d14bc2245c --- /dev/null +++ b/model/model/layers/19/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2811837bfc4cd54fccc9b22afd31c1449a7b965681e6cd6b98ccd4ff1fbf2b57 +size 1225509 diff --git a/model/model/layers/19/self_attn/v_proj/kernel/3.0 b/model/model/layers/19/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..034dd69ab3293d187fe7572629f570963e1f1e7d --- /dev/null +++ b/model/model/layers/19/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ddccbb02e9c243703babe2d867c79892970f4906a52610173c8d028c6a0ce9e +size 1225446 
diff --git a/model/model/layers/2/input_layernorm/kernel/.zarray b/model/model/layers/2/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/2/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/input_layernorm/kernel/0 b/model/model/layers/2/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..9754390c805afb589986f5f4c185c13a6c67770e Binary files /dev/null and b/model/model/layers/2/input_layernorm/kernel/0 differ diff --git a/model/model/layers/2/mlp/down_proj/kernel/.zarray b/model/model/layers/2/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/2/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/mlp/down_proj/kernel/0.0 b/model/model/layers/2/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f9b9ebfbac46ff9635fdbd9d1f1d8f43644aba3b --- /dev/null +++ b/model/model/layers/2/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02150aa645010433475037d4321e1c50bdb11ca9906e47c2ca6b95d80613ae28 +size 9791591 diff --git a/model/model/layers/2/mlp/down_proj/kernel/0.1 b/model/model/layers/2/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..3a542c99cb97c026893274a8196641838429edce --- 
/dev/null +++ b/model/model/layers/2/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3292bd02c63b7da88f4a71b360d94044687b932a266b36f2a749a177f8d26105 +size 9791060 diff --git a/model/model/layers/2/mlp/down_proj/kernel/0.2 b/model/model/layers/2/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..9c925a1f3990ea2e20ce7a259b1d7b79905cf0b2 --- /dev/null +++ b/model/model/layers/2/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fe67cf950f4fe85ea49f09fd0f46f2ffc55ebf48a024dae2aca51b8f232f1ef +size 9791264 diff --git a/model/model/layers/2/mlp/down_proj/kernel/0.3 b/model/model/layers/2/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..518de4f616bf7919377508da61b23b9a813e67b1 --- /dev/null +++ b/model/model/layers/2/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1729820086e8140d9fac13dfe4f66d72771c568faac160067b8f789f3983c4eb +size 9790741 diff --git a/model/model/layers/2/mlp/gate_proj/kernel/.zarray b/model/model/layers/2/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/2/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/mlp/gate_proj/kernel/0.0 b/model/model/layers/2/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..2582d7991ee173631adc7edbf10e6d1c69209034 --- /dev/null +++ b/model/model/layers/2/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:e8af2dfed68e9f8fc3afd5d82845562fb01dc336ca1f3efdc532c3c3e1029851 +size 9802104 diff --git a/model/model/layers/2/mlp/gate_proj/kernel/1.0 b/model/model/layers/2/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..5f7dd8e5686069f83779348e561815887602775a --- /dev/null +++ b/model/model/layers/2/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b582be051a3ddd902417c28654ea6e36f1e6fc133cfdff374fb82c9eea46c1c7 +size 9800125 diff --git a/model/model/layers/2/mlp/gate_proj/kernel/2.0 b/model/model/layers/2/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..8da4e7cc618bc17f36f1153c9dad592326911e0f --- /dev/null +++ b/model/model/layers/2/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36ca2de7016d2ed2b498070111eec76565d4b373990d6932fd493262b12f3408 +size 9801535 diff --git a/model/model/layers/2/mlp/gate_proj/kernel/3.0 b/model/model/layers/2/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..1c5f269679c918004f5380b78e25705a1e705044 --- /dev/null +++ b/model/model/layers/2/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ea799554d8323082d4be3ae5ab6b40b684ed3ec5fbdfafb4e5e1193538ac2d7 +size 9800055 diff --git a/model/model/layers/2/mlp/up_proj/kernel/.zarray b/model/model/layers/2/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/2/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/mlp/up_proj/kernel/0.0 
b/model/model/layers/2/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..52d0c64e3d93d0070f1617b4fddc2a5e486e57bc --- /dev/null +++ b/model/model/layers/2/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24c9a5c230da8c50dbe8202dbce23a01485eb8a7a2376b47beb7fde9e365b9d6 +size 9792900 diff --git a/model/model/layers/2/mlp/up_proj/kernel/1.0 b/model/model/layers/2/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..3b069c50ee8fdb1b93e571e35f5cc9d90b391d8f --- /dev/null +++ b/model/model/layers/2/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4cfcba516a4781e42da6c9a206ba0a6c4bfc99389d22d85d110a10c663486d7 +size 9793637 diff --git a/model/model/layers/2/mlp/up_proj/kernel/2.0 b/model/model/layers/2/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..5ee984491f186864a670f797b1583d8389df67b6 --- /dev/null +++ b/model/model/layers/2/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eee3e34751be4a41f64cf5bf9c49c28e58fccba206f7b5d687f85d65328a5e71 +size 9794838 diff --git a/model/model/layers/2/mlp/up_proj/kernel/3.0 b/model/model/layers/2/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..347fd416512e3b6b45de4ad669f383dd6e7157dd --- /dev/null +++ b/model/model/layers/2/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e823ec8cd1fac94a7b1cdd6adb899077be2834f008ee68f8338d9bcc1a50e70 +size 9792869 diff --git a/model/model/layers/2/post_attention_layernorm/kernel/.zarray b/model/model/layers/2/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/2/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/post_attention_layernorm/kernel/0 b/model/model/layers/2/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..ef6ed3b2ecb13e4ac7dc6738823c8f95632adb0c Binary files /dev/null and b/model/model/layers/2/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/2/self_attn/k_proj/kernel/.zarray b/model/model/layers/2/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/2/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/self_attn/k_proj/kernel/0.0 b/model/model/layers/2/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..d1f6a6cb4ff536a183e5dfefd3d17e7cb0695f4f --- /dev/null +++ b/model/model/layers/2/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38e38651293a9cec033258a73faf03b456793cbf37a8bc0a4e369fb8ad2df419 +size 1238503 diff --git a/model/model/layers/2/self_attn/k_proj/kernel/1.0 b/model/model/layers/2/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..e30ddf8f1b7295137ffca1182b177ae1946c7dd7 --- /dev/null +++ b/model/model/layers/2/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6adc4f08bc487116d28ae57ef7294f02b1145f29793ddbb19360ccf978e636f +size 1238747 diff --git 
a/model/model/layers/2/self_attn/k_proj/kernel/2.0 b/model/model/layers/2/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..1075d04f55a24b3fe84a86ea8c8f8b67499191c4 --- /dev/null +++ b/model/model/layers/2/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48f87b396857a3ba3405402630c55f399ca2cb4c7fac235c0fb03d183fb0fa76 +size 1238963 diff --git a/model/model/layers/2/self_attn/k_proj/kernel/3.0 b/model/model/layers/2/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..fd740c9e9763b2de4419658f702ff68aeb2be0f4 --- /dev/null +++ b/model/model/layers/2/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:196f8f532b1574ae25ad9af4e4946010a6e4733cad04467a0ff5de2f77b15c02 +size 1237810 diff --git a/model/model/layers/2/self_attn/o_proj/kernel/.zarray b/model/model/layers/2/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/2/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/self_attn/o_proj/kernel/0.0 b/model/model/layers/2/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..2067b3b4fe062cefa48d4a470d0b9ad883800f35 --- /dev/null +++ b/model/model/layers/2/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d61493187a84e540c86fc3661c9c98c6e94d95d7859c186cb16324fc815f0d8 +size 3673217 diff --git a/model/model/layers/2/self_attn/o_proj/kernel/0.1 b/model/model/layers/2/self_attn/o_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..9c75b37f1637cb679f65d058b5d0c9c33c8f7bcb --- /dev/null +++ b/model/model/layers/2/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:284e7a0b744ca2c6238024c464ab00f1bbc29b2bb6101ac43cc0003caace7876 +size 3672586 diff --git a/model/model/layers/2/self_attn/o_proj/kernel/0.2 b/model/model/layers/2/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..79bc44b37448b2ca9d67133ff4038cf2a2d2ddc5 --- /dev/null +++ b/model/model/layers/2/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13192fe797e68d54b69476565bb0d3c51682f6ca47f869569af16817791acdce +size 3672044 diff --git a/model/model/layers/2/self_attn/o_proj/kernel/0.3 b/model/model/layers/2/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..637624ae1b8a35fe1bb736fefb75cefcc2127f5a --- /dev/null +++ b/model/model/layers/2/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fe40585ab30a930697d439ec82db8a3e39b8ca84034d11b48320062e420243d +size 3673523 diff --git a/model/model/layers/2/self_attn/q_proj/kernel/.zarray b/model/model/layers/2/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/2/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/self_attn/q_proj/kernel/0.0 b/model/model/layers/2/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..1be526aec56b3b5b0f9b3421c39fff0b8f9de6fd --- /dev/null +++ 
b/model/model/layers/2/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58015c09b69f6e6373f8f1b7f24405b862035aea4678658e80a5a863f7770613 +size 3711300 diff --git a/model/model/layers/2/self_attn/q_proj/kernel/1.0 b/model/model/layers/2/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..fe848ca888d262ff41ff6df812e7b443ec1176a8 --- /dev/null +++ b/model/model/layers/2/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5397d25dc1adf01e6f4224af71236ac0d6e2b04ff2a807241ef710ceeb68669 +size 3712440 diff --git a/model/model/layers/2/self_attn/q_proj/kernel/2.0 b/model/model/layers/2/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..66e6f5697098cff13ff27a178dd908d73d6e0f70 --- /dev/null +++ b/model/model/layers/2/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:334c1ce0d9025ff72c77bbae6613c82296efbf68560ae37cdda687d81e8c0bff +size 3713804 diff --git a/model/model/layers/2/self_attn/q_proj/kernel/3.0 b/model/model/layers/2/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..427123d341996d930473b153767cbebdaa77dde3 --- /dev/null +++ b/model/model/layers/2/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f4a9be240d5ada5977367300c33bd936223e844aeef5158be96b7e964d21fcf +size 3711312 diff --git a/model/model/layers/2/self_attn/v_proj/kernel/.zarray b/model/model/layers/2/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/2/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/self_attn/v_proj/kernel/0.0 b/model/model/layers/2/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..0c46678f943c8cba4dbea12b7075937c0a76e480 --- /dev/null +++ b/model/model/layers/2/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b99a209792bd0d494ce49cdc8f1c7954b9c23da4914e03bf32a4e09f8ba85268 +size 1229742 diff --git a/model/model/layers/2/self_attn/v_proj/kernel/1.0 b/model/model/layers/2/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..9ac27007cc066f9db4105ef399c15c82adf3ab3f --- /dev/null +++ b/model/model/layers/2/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9b4ba0824cff99e6f1b6f137e6152793c54091d84e3bb55473b49b1048b029f +size 1230012 diff --git a/model/model/layers/2/self_attn/v_proj/kernel/2.0 b/model/model/layers/2/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..c36a2096e6dcfc016f8f53912882f8c9768d7775 --- /dev/null +++ b/model/model/layers/2/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b4d9cb692724bf46f4c914c3e17a0263ed121a82f935a0b4fb3547f16c70920 +size 1230261 diff --git a/model/model/layers/2/self_attn/v_proj/kernel/3.0 b/model/model/layers/2/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..24e93c78529e6cc27d94a3871dcfe8f3b90f9980 --- /dev/null +++ b/model/model/layers/2/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f2422828219b8ca2b3a352fc1ea7c27e7d2cd28cf1fe7f3d0b6a3b05490f9f1 +size 1229729 diff --git 
a/model/model/layers/20/input_layernorm/kernel/.zarray b/model/model/layers/20/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/20/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/20/input_layernorm/kernel/0 b/model/model/layers/20/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..ec41528206e0a5aeada1bf341cdfb9d5275fb922 Binary files /dev/null and b/model/model/layers/20/input_layernorm/kernel/0 differ diff --git a/model/model/layers/20/mlp/down_proj/kernel/.zarray b/model/model/layers/20/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/20/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/20/mlp/down_proj/kernel/0.0 b/model/model/layers/20/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a3e43cc448a0c0a07b5de4cad1a76530600f255d --- /dev/null +++ b/model/model/layers/20/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d51402fe9fc340b42795285df199e1439808913bf16c07579a8b3746a50c308 +size 9797284 diff --git a/model/model/layers/20/mlp/down_proj/kernel/0.1 b/model/model/layers/20/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..025dbf96c94b08b71bc3cc7c642ea384c16ebab0 --- 
/dev/null +++ b/model/model/layers/20/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cca1a0075e6891e484b09ace59905fe6aa6ab5c9b1ee35797b6ecc3b5533096b +size 9798924 diff --git a/model/model/layers/20/mlp/down_proj/kernel/0.2 b/model/model/layers/20/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..c3f07a2762f1cf9fc82b708592812444da272841 --- /dev/null +++ b/model/model/layers/20/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c03ab6c23764073ea2e91d27f6231aedae8121c51db56f34408b24e2f098f168 +size 9798468 diff --git a/model/model/layers/20/mlp/down_proj/kernel/0.3 b/model/model/layers/20/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..f921161b7ad7f74af55eca68bb99acfed57d8516 --- /dev/null +++ b/model/model/layers/20/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcae7a36221c239cac344182540bb4cbab098353045a2c23686231fad216dfda +size 9797469 diff --git a/model/model/layers/20/mlp/gate_proj/kernel/.zarray b/model/model/layers/20/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/20/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/20/mlp/gate_proj/kernel/0.0 b/model/model/layers/20/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8a33eb6be4c79cb9599ce017f90eed4a725a1eb6 --- /dev/null +++ b/model/model/layers/20/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:a92a33144808295abd9813703fbd631298e2ba76f4db27a96d3c81022907a6d5 +size 9809410 diff --git a/model/model/layers/20/mlp/gate_proj/kernel/1.0 b/model/model/layers/20/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..d5ea858bfbb249c2fb44e9c1f280138688c231f0 --- /dev/null +++ b/model/model/layers/20/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19ee80110339528c07204bf8c5c40764d183d4400cc6f2082e005e72445a90ed +size 9809402 diff --git a/model/model/layers/20/mlp/gate_proj/kernel/2.0 b/model/model/layers/20/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..b4a2ee33e9f6ddb270625f896596c7d068a65ceb --- /dev/null +++ b/model/model/layers/20/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c68b466a0f0ec1429f79a7f3f040b490b6fc90e02214e4aed6ac83eeb3103c4 +size 9809406 diff --git a/model/model/layers/20/mlp/gate_proj/kernel/3.0 b/model/model/layers/20/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6ceddb648306328e381674f912bb745009c67191 --- /dev/null +++ b/model/model/layers/20/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63a1689e1a0b894c3c8f11532edb438fa5717d047ef8d6a8a1b17a225cc61fdc +size 9809789 diff --git a/model/model/layers/20/mlp/up_proj/kernel/.zarray b/model/model/layers/20/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/20/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/20/mlp/up_proj/kernel/0.0 
b/model/model/layers/20/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..9e2176b10dfb6284fee578470a0b7f5d2bd86a8a --- /dev/null +++ b/model/model/layers/20/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d4c7866ee213bfd3a268c692f003ac4a9d7a429dd4f9f998e8eb2d786a5b6e3 +size 9792047 diff --git a/model/model/layers/20/mlp/up_proj/kernel/1.0 b/model/model/layers/20/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..c8fb314c481fa295f8db0f5ca1cccce32e08c01b --- /dev/null +++ b/model/model/layers/20/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94daa5a3d077992d3f0faba61b7b9f3336bb34a4cb6f41d15b529d19d8703162 +size 9791773 diff --git a/model/model/layers/20/mlp/up_proj/kernel/2.0 b/model/model/layers/20/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..751a1cbb73b58e1a0450b8676988db36be9f60d9 --- /dev/null +++ b/model/model/layers/20/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f906caf8f33f362564fba84849df4fb07a712dac4d4b0c0c62ebdc3488be28f8 +size 9792280 diff --git a/model/model/layers/20/mlp/up_proj/kernel/3.0 b/model/model/layers/20/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..90ccd806d1c692d9c4808e28b708561643bb7a4e --- /dev/null +++ b/model/model/layers/20/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beddac6607fe56b31d351a9098aa03251e7717ad64effcb854115f51fd3422e6 +size 9792105 diff --git a/model/model/layers/20/post_attention_layernorm/kernel/.zarray b/model/model/layers/20/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/20/post_attention_layernorm/kernel/.zarray @@ 
-0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/20/post_attention_layernorm/kernel/0 b/model/model/layers/20/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..ba1202924ee8a3068bdabfd3d1d5350f4c1c5b94 Binary files /dev/null and b/model/model/layers/20/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/20/self_attn/k_proj/kernel/.zarray b/model/model/layers/20/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/20/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/20/self_attn/k_proj/kernel/0.0 b/model/model/layers/20/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f1065005d3e58bdd6ba3b2a6b1cd2c26cc1235f1 --- /dev/null +++ b/model/model/layers/20/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bc26dff9a5e5c395ef784ea0ba358f6c28d78846787579ed3903e0d9710d72d +size 1233101 diff --git a/model/model/layers/20/self_attn/k_proj/kernel/1.0 b/model/model/layers/20/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..0d120be77093f9a3400ec6ea4ff6e5e65202aa72 --- /dev/null +++ b/model/model/layers/20/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abc503d9ac3fad4b4a1df69e5bb6e84ab9fdd2109937fef0d293d6690342b6df +size 1232785 diff --git 
a/model/model/layers/20/self_attn/k_proj/kernel/2.0 b/model/model/layers/20/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..73e472f4343a77648fe30e21def2e1e48689b88e --- /dev/null +++ b/model/model/layers/20/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40dbdce06811f0058c85c3141d240427703c32b23ab11cfe0cbf6d1f30021341 +size 1232780 diff --git a/model/model/layers/20/self_attn/k_proj/kernel/3.0 b/model/model/layers/20/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..0db6f0b8f77cf706880afb12e5ade12daabf6729 --- /dev/null +++ b/model/model/layers/20/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a325073c322ac0362506dcb295457198ee5abcb520111cd92d2e010af48ffece +size 1232732 diff --git a/model/model/layers/20/self_attn/o_proj/kernel/.zarray b/model/model/layers/20/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/20/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/20/self_attn/o_proj/kernel/0.0 b/model/model/layers/20/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..9bb1eaf20f5ec11758f8294f401eb73c73ab7444 --- /dev/null +++ b/model/model/layers/20/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12ca3e0af8bc11a5298923b2cfe8758265073d73c7129e3c8cb053cdc37604e3 +size 3667511 diff --git a/model/model/layers/20/self_attn/o_proj/kernel/0.1 b/model/model/layers/20/self_attn/o_proj/kernel/0.1 new file mode 100644 
index 0000000000000000000000000000000000000000..2553b965462383d3febb130fc68ce44cdfaf44ee --- /dev/null +++ b/model/model/layers/20/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e352f943955416cc7bea95820cf9d897ea9f0eae95190f98961d4a7cc23f1d5c +size 3667367 diff --git a/model/model/layers/20/self_attn/o_proj/kernel/0.2 b/model/model/layers/20/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..28acc5981345baf619346feea75b412312009184 --- /dev/null +++ b/model/model/layers/20/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42f9a748ee8c8fd1ccb471b39557904c066555c77f1cb7ce6a5d712720a6d1e7 +size 3667753 diff --git a/model/model/layers/20/self_attn/o_proj/kernel/0.3 b/model/model/layers/20/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..cd381cc7edfa567d00abfeb85ec89578733cd67e --- /dev/null +++ b/model/model/layers/20/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae632b6f92cfd646ea59fab846a1587fecdad37033caf30ac9929a6abf33622c +size 3667477 diff --git a/model/model/layers/20/self_attn/q_proj/kernel/.zarray b/model/model/layers/20/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/20/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/20/self_attn/q_proj/kernel/0.0 b/model/model/layers/20/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8d5f8768c1b5d97a0ad549f8d5caef255d9d65e0 --- /dev/null +++ 
b/model/model/layers/20/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82dc32355080e509403a6720072ba09d6308876e746443d252964eecf86d7966 +size 3698720 diff --git a/model/model/layers/20/self_attn/q_proj/kernel/1.0 b/model/model/layers/20/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..6b6e63f6f0b62b8e620e57b058226649e00e91a7 --- /dev/null +++ b/model/model/layers/20/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5070e8cad92d3a4f8b57e9a8d5634a92ad0b355011b4d8dd99906c900e4d4648 +size 3698322 diff --git a/model/model/layers/20/self_attn/q_proj/kernel/2.0 b/model/model/layers/20/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..9a25ddb7d36501cd2357b138c634e179352e76ad --- /dev/null +++ b/model/model/layers/20/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee04919bb3a921974da067b6d5aa24d4be655d98495145bf9a6dd80e9af126bb +size 3698498 diff --git a/model/model/layers/20/self_attn/q_proj/kernel/3.0 b/model/model/layers/20/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..0f20da70da1041d25b81390d7060e39ccd7225d2 --- /dev/null +++ b/model/model/layers/20/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fa0364e2b5d4a73f7131ec0d726d8205accada350c4212bfa750f599daf52dd +size 3698080 diff --git a/model/model/layers/20/self_attn/v_proj/kernel/.zarray b/model/model/layers/20/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/20/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/20/self_attn/v_proj/kernel/0.0 b/model/model/layers/20/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..94386e5fe57cec1910486a56b22bcc6c96da8037 --- /dev/null +++ b/model/model/layers/20/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b51a1f82355af08524bdc7434f03f48a7f54e8012c44a89dfb56f50387f4e0a7 +size 1225212 diff --git a/model/model/layers/20/self_attn/v_proj/kernel/1.0 b/model/model/layers/20/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..4d5f3f2520e5b9d4dec872916cd7b7275d34a044 --- /dev/null +++ b/model/model/layers/20/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f2e0a6fb38ccd9abb9af8d919d166f7ed4630eb9892a10b4c672b1ff220c5e8 +size 1225121 diff --git a/model/model/layers/20/self_attn/v_proj/kernel/2.0 b/model/model/layers/20/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..eab7d9305461d66793fa7d98c1c8713c4fad0671 --- /dev/null +++ b/model/model/layers/20/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdba36a54035fc4bb8a9f5f4e77be3319a701866213f8554156cd90297516ea9 +size 1225026 diff --git a/model/model/layers/20/self_attn/v_proj/kernel/3.0 b/model/model/layers/20/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..473504e1bee77e7fe847faab07561d9435c4bf5d --- /dev/null +++ b/model/model/layers/20/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfdebf9a089015bc4ae4b77bb03fcaf26f4788d5da9fa77853329529f8f61acd +size 1224535 
diff --git a/model/model/layers/21/input_layernorm/kernel/.zarray b/model/model/layers/21/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/21/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/21/input_layernorm/kernel/0 b/model/model/layers/21/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..422df7fa45e5b1f69ac6ac447ecce15d024a5a2b Binary files /dev/null and b/model/model/layers/21/input_layernorm/kernel/0 differ diff --git a/model/model/layers/21/mlp/down_proj/kernel/.zarray b/model/model/layers/21/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/21/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/21/mlp/down_proj/kernel/0.0 b/model/model/layers/21/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..454f589f54d033a55608addf5173d6981803f2c4 --- /dev/null +++ b/model/model/layers/21/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c0dc215934fbac591c1d3bb08e6378c7db0c5e0673128376efa80b7f8bc68df +size 9798751 diff --git a/model/model/layers/21/mlp/down_proj/kernel/0.1 b/model/model/layers/21/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..f747043234138574fbcc706a5b7d186df933e64b --- /dev/null +++ b/model/model/layers/21/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be37531f890421575b2ad67cfe3df2461e7599d656d034b05d1dd4a077df353a +size 9798437 diff --git a/model/model/layers/21/mlp/down_proj/kernel/0.2 b/model/model/layers/21/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..f68b08172e532648c1c4ad8b80de8cd94ca32c70 --- /dev/null +++ b/model/model/layers/21/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f49544e79c38f1b932c74b63581ad441008e0b7720615d027690c56533c050f +size 9798953 diff --git a/model/model/layers/21/mlp/down_proj/kernel/0.3 b/model/model/layers/21/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..b964421321a0dc73256ebb269cfbcd10b52587ea --- /dev/null +++ b/model/model/layers/21/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0321bf960045fbd4973e00df94ad88a6277d38caaf22dc2ba142dfc3e7669df +size 9796910 diff --git a/model/model/layers/21/mlp/gate_proj/kernel/.zarray b/model/model/layers/21/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/21/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/21/mlp/gate_proj/kernel/0.0 b/model/model/layers/21/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..70bbe095c4ab511bd2a2d532db753428cb6ded34 --- /dev/null +++ b/model/model/layers/21/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1de3c0c5539393a59ab3ae7174fdfc3fa856c669e6201fd07b8e39fa477d1e9 +size 9809271 diff --git a/model/model/layers/21/mlp/gate_proj/kernel/1.0 b/model/model/layers/21/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..ec833fa1e81940afe31a1de56658dfc0becafeb1 --- /dev/null +++ b/model/model/layers/21/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:003a41ef24fdbf94653ea3145c1ba8fa4ae451a7eecc3a9c6c53b1979def7590 +size 9810243 diff --git a/model/model/layers/21/mlp/gate_proj/kernel/2.0 b/model/model/layers/21/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..4e84477710266ef9c190ef6a97b1a03611827331 --- /dev/null +++ b/model/model/layers/21/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b8b3a38721892130f314baa68bcc5e50c3d36b2cab94671d5dd32693c00bdd3 +size 9810700 diff --git a/model/model/layers/21/mlp/gate_proj/kernel/3.0 b/model/model/layers/21/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..bfba502daecae9cd66a759468af0ae467a3d46a1 --- /dev/null +++ b/model/model/layers/21/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdc896f839a0799f348c11c2e4c3d40d11ceb04a774794a6d2c7ddb2a27284c3 +size 9810795 diff --git a/model/model/layers/21/mlp/up_proj/kernel/.zarray b/model/model/layers/21/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/21/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/21/mlp/up_proj/kernel/0.0 b/model/model/layers/21/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..99fc5c05d7efc09422d8e844f3953c390440eaa0 --- /dev/null +++ b/model/model/layers/21/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81a0d20d4e447bbe7992c066c015671263722b0c9a9121624d5553e0530d8424 +size 9791060 diff --git a/model/model/layers/21/mlp/up_proj/kernel/1.0 b/model/model/layers/21/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..abd7f96062ba11dedb2b562ccae2fda5c8357ab8 --- /dev/null +++ b/model/model/layers/21/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee30e917987eea4e69d047005ac9326d9c693dc7fcf54d8757e72378a3674709 +size 9791570 diff --git a/model/model/layers/21/mlp/up_proj/kernel/2.0 b/model/model/layers/21/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..e491734657af4fbf40373e668fd3b1dfdaeff31c --- /dev/null +++ b/model/model/layers/21/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9825514ca75977fad31ce3491f16333685367d4802f5322759498e5aad806b69 +size 9792423 diff --git a/model/model/layers/21/mlp/up_proj/kernel/3.0 b/model/model/layers/21/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6e93f33d61b752f185eb713c84988787597c4f39 --- /dev/null +++ b/model/model/layers/21/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da0c58571b676f8ae98f58190c475c6a86d9a92b83a119e01c8a1c7c957ad60e +size 9791713 diff --git a/model/model/layers/21/post_attention_layernorm/kernel/.zarray b/model/model/layers/21/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ 
b/model/model/layers/21/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/21/post_attention_layernorm/kernel/0 b/model/model/layers/21/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..e4954da28002f8509ded8d69e3ef1e67781a30db Binary files /dev/null and b/model/model/layers/21/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/21/self_attn/k_proj/kernel/.zarray b/model/model/layers/21/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/21/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/21/self_attn/k_proj/kernel/0.0 b/model/model/layers/21/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..fe68552ace63dd3c53c95a8ece522d3f6c152c45 --- /dev/null +++ b/model/model/layers/21/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c425fcd8df9106f5495fdd316ca5bac3610087cbae90f12acc318901e099bb71 +size 1233391 diff --git a/model/model/layers/21/self_attn/k_proj/kernel/1.0 b/model/model/layers/21/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..dce235820feea0258acb5b5b395e5017e3e224db --- /dev/null +++ b/model/model/layers/21/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:62da7f0d8462cbc51b9179ee1a6479c81f34791f8e95a71cf5754d789aaad802 +size 1233744 diff --git a/model/model/layers/21/self_attn/k_proj/kernel/2.0 b/model/model/layers/21/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..fb22b184183826e7a5f54599c3fca19f611a36be --- /dev/null +++ b/model/model/layers/21/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b4fab19b839fd26738fbadbf0a366e63c22b4a4c2d6b911534fc14c55b0e130 +size 1233920 diff --git a/model/model/layers/21/self_attn/k_proj/kernel/3.0 b/model/model/layers/21/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..de381363c328d18cb7ec70e10c9f5d6c6b650120 --- /dev/null +++ b/model/model/layers/21/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca2883cc44dfd3c0e3a657f532c4f8feada373e05e102e4c69a8c3ed3809e642 +size 1233812 diff --git a/model/model/layers/21/self_attn/o_proj/kernel/.zarray b/model/model/layers/21/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/21/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/21/self_attn/o_proj/kernel/0.0 b/model/model/layers/21/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c044de00c90e4d4a831fbee1c3a02434934acb5e --- /dev/null +++ b/model/model/layers/21/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9c17956b2d1bd8607feee24afc6d29cda5e5af2abc92d1e84fe68a16c6447d1 +size 3671470 diff --git 
a/model/model/layers/21/self_attn/o_proj/kernel/0.1 b/model/model/layers/21/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..6f3fa1670fa5c1baa8ecf2a6f61964cc643f2131 --- /dev/null +++ b/model/model/layers/21/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67711b87f6cf7943a4a69192afbb7b5e9baa6da735b444c668324147b2bc7750 +size 3670640 diff --git a/model/model/layers/21/self_attn/o_proj/kernel/0.2 b/model/model/layers/21/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..0a9a124f4833a058ccaaac7f9f010f60e00da2dc --- /dev/null +++ b/model/model/layers/21/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29f54aa616d1dbe9176e3d3a501830c116b781f2ec1dec0966b80f18a310947c +size 3671769 diff --git a/model/model/layers/21/self_attn/o_proj/kernel/0.3 b/model/model/layers/21/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..38f762cdc55f7ea36f5dcd6b2b9929599cfcc7cb --- /dev/null +++ b/model/model/layers/21/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88155a77acd730a90b973b4204b24e97f25538d0c821dd217b41ca7d5fc5affa +size 3670941 diff --git a/model/model/layers/21/self_attn/q_proj/kernel/.zarray b/model/model/layers/21/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/21/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/21/self_attn/q_proj/kernel/0.0 b/model/model/layers/21/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..31f64981e5888998a1e47c8b036ae551029ce1ef --- /dev/null +++ b/model/model/layers/21/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f70292c71fa52ebbc8a82c843beaa54cdb748764140b70d3ad14c92ab9ea4106 +size 3701589 diff --git a/model/model/layers/21/self_attn/q_proj/kernel/1.0 b/model/model/layers/21/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..39e962ff56355f8c2a9a9e498df886fd2de199ce --- /dev/null +++ b/model/model/layers/21/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5c6deead3f09776ea3c3cbeb2ecfd80b4db2fcabb6834e35e977b85fbd7962b +size 3701729 diff --git a/model/model/layers/21/self_attn/q_proj/kernel/2.0 b/model/model/layers/21/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..d06bf502a4154843100b2eb52a1b14b8e6beb783 --- /dev/null +++ b/model/model/layers/21/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24147156a6cc7b30a8cc768fea5f8587b651c787c7bd183b9f4a7ce7b2f4cc7d +size 3701477 diff --git a/model/model/layers/21/self_attn/q_proj/kernel/3.0 b/model/model/layers/21/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..324039de32b4e46410630f6dff7db09f9e8b5ebc --- /dev/null +++ b/model/model/layers/21/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34afaf7d0e22464f3d739b7924d9259ffe5ec2992bd6220ec5e5ac180c94d9db +size 3701513 diff --git a/model/model/layers/21/self_attn/v_proj/kernel/.zarray b/model/model/layers/21/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/21/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/21/self_attn/v_proj/kernel/0.0 b/model/model/layers/21/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e2deb222e88ccca14ed5a7ef5f563cec731af373 --- /dev/null +++ b/model/model/layers/21/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e33fac36274ddcb9fe8c49f1fd88937cc89d139c590e6c64b95313328799fa76 +size 1228017 diff --git a/model/model/layers/21/self_attn/v_proj/kernel/1.0 b/model/model/layers/21/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..6d9f344d6d31aee6580a09cfacbf47ebb35e2882 --- /dev/null +++ b/model/model/layers/21/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:700af5ed4014e58deaeb1476221319f39fca3a4be115e06fdfd0a989a550ecac +size 1228810 diff --git a/model/model/layers/21/self_attn/v_proj/kernel/2.0 b/model/model/layers/21/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..f1c9890f4151fac7977a564a5b6dac906b6d4da1 --- /dev/null +++ b/model/model/layers/21/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a79705ecd2a01d4110d388fb336f4a514f0dc7109015aa906b5271b8935f4756 +size 1228397 diff --git a/model/model/layers/21/self_attn/v_proj/kernel/3.0 b/model/model/layers/21/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..85652fc15e64fb54fa510d852ed188a04e3e5269 --- /dev/null +++ b/model/model/layers/21/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7e7231d06d613ec2cfee8a666a7a1160922bfdf2c8661883130871260b99e1a +size 1227982 
diff --git a/model/model/layers/22/input_layernorm/kernel/.zarray b/model/model/layers/22/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/22/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/22/input_layernorm/kernel/0 b/model/model/layers/22/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..5298fb1751e75a4cd1a735a13772b165d61f8399 Binary files /dev/null and b/model/model/layers/22/input_layernorm/kernel/0 differ diff --git a/model/model/layers/22/mlp/down_proj/kernel/.zarray b/model/model/layers/22/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/22/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/22/mlp/down_proj/kernel/0.0 b/model/model/layers/22/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c5858818e6ef69aaa90eb5da2943c9c6ef0b3ef9 --- /dev/null +++ b/model/model/layers/22/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bae1359b6b21d94aeb97af5ebc6bdcec3f8e238358807757baa2fe0498e0d8e +size 9799171 diff --git a/model/model/layers/22/mlp/down_proj/kernel/0.1 b/model/model/layers/22/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..fab570502cbffd76970af65bd5c4cd57394cb9dc --- /dev/null +++ b/model/model/layers/22/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:271f6b40bc7845c9d2095bc514d9d7070abfc291767c499aeb981b41b1a2d6ef +size 9800390 diff --git a/model/model/layers/22/mlp/down_proj/kernel/0.2 b/model/model/layers/22/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..cd19925db94e061f19f98f8348e4fac4e1b9cacf --- /dev/null +++ b/model/model/layers/22/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7ee803e456f76dbf077aa0fd0087eac9dd6d049925ab4bf4cb0a3646be6b190 +size 9799251 diff --git a/model/model/layers/22/mlp/down_proj/kernel/0.3 b/model/model/layers/22/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..4f796a4c4a38bae0621bf3ab320a5763b0cce92f --- /dev/null +++ b/model/model/layers/22/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fde961b4cba4c49957e0e57acb887cd315e3db1c9ce6b097fc6236badda3e79e +size 9798283 diff --git a/model/model/layers/22/mlp/gate_proj/kernel/.zarray b/model/model/layers/22/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/22/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/22/mlp/gate_proj/kernel/0.0 b/model/model/layers/22/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..53962d5b0dfaa85efa7fa28c2a6a2a5801225fe7 --- /dev/null +++ b/model/model/layers/22/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5077faeabcf58f53d2c18a3bee976aa82cf412b47ccb1c3317bbf5ec062c0e9 +size 9811639 diff --git a/model/model/layers/22/mlp/gate_proj/kernel/1.0 b/model/model/layers/22/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..e6ba3c49965c2f4a85cf4d2b9dd6488f2f73682f --- /dev/null +++ b/model/model/layers/22/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0692b2643a256129990bb27dc703a96353a22a9e32116b7b441672b7df4699ef +size 9811796 diff --git a/model/model/layers/22/mlp/gate_proj/kernel/2.0 b/model/model/layers/22/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..84ddd012a31c4308b332e8eb1a4884448797abcc --- /dev/null +++ b/model/model/layers/22/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8d08acdddf325b7857dd6ed808c25eba07e446b287e26a55f664f72ceb4ba8c +size 9811823 diff --git a/model/model/layers/22/mlp/gate_proj/kernel/3.0 b/model/model/layers/22/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..ac9e608635816f66d4e25d619bbebd7117f2dad5 --- /dev/null +++ b/model/model/layers/22/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e93b44e6e59c54612f268495d31b56479246d4603558db6c0f63a236526dba6 +size 9811895 diff --git a/model/model/layers/22/mlp/up_proj/kernel/.zarray b/model/model/layers/22/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/22/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/22/mlp/up_proj/kernel/0.0 b/model/model/layers/22/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..b1e49958f2cf8ffe736db2b638963c274ef5feb4 --- /dev/null +++ b/model/model/layers/22/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1195d147ffa7fbf3f988e8bf5825d17713cbd1c385af3e40302ce5c5aca397ae +size 9792338 diff --git a/model/model/layers/22/mlp/up_proj/kernel/1.0 b/model/model/layers/22/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..9470cffa9dc8b13060adef3f4e85cca65a5f30a0 --- /dev/null +++ b/model/model/layers/22/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6535ab28ac2318b5e63a6a66f105cafd3ee564c9e756dc4acb0665ca3fcfef22 +size 9792159 diff --git a/model/model/layers/22/mlp/up_proj/kernel/2.0 b/model/model/layers/22/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..c5e7f9701c7a6563aecc40124a00da63230f6ee7 --- /dev/null +++ b/model/model/layers/22/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f59e0591af228ba0817f590530fafa1854320dbf376566472984cf75f19a1dea +size 9792439 diff --git a/model/model/layers/22/mlp/up_proj/kernel/3.0 b/model/model/layers/22/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..cb8a8586bb00b46ed344210e0aa09938c20ef7e5 --- /dev/null +++ b/model/model/layers/22/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5da70a37757aa2b375e717dc311c5835a3bf4087b2c415a4eab6db53d73921c4 +size 9792232 diff --git a/model/model/layers/22/post_attention_layernorm/kernel/.zarray b/model/model/layers/22/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ 
b/model/model/layers/22/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/22/post_attention_layernorm/kernel/0 b/model/model/layers/22/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..a2be38562fb34e0cb77990edf3b116999399ce5b Binary files /dev/null and b/model/model/layers/22/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/22/self_attn/k_proj/kernel/.zarray b/model/model/layers/22/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/22/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/22/self_attn/k_proj/kernel/0.0 b/model/model/layers/22/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a2d0e51cdf4009549a6889ed892bcd07dd2d3ab4 --- /dev/null +++ b/model/model/layers/22/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8db0ca6ea7221b88289795b65744ff3d31a882a41c0a9bba706c4417696fc401 +size 1236212 diff --git a/model/model/layers/22/self_attn/k_proj/kernel/1.0 b/model/model/layers/22/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..0a6d0f895800b7240110e7d5b6cc728de7d8da66 --- /dev/null +++ b/model/model/layers/22/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:b0e196180d56f531a1705a67762870086fc39c2929cb14f2623b508cb86b65c6 +size 1236083 diff --git a/model/model/layers/22/self_attn/k_proj/kernel/2.0 b/model/model/layers/22/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..65178adeb5caf6a65a4fff9fb87c3af59c10ced5 --- /dev/null +++ b/model/model/layers/22/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5a2e212215de9fa8f3ea1f7f105ce0e972182338ddc0207c06c81f931ad8af1 +size 1236216 diff --git a/model/model/layers/22/self_attn/k_proj/kernel/3.0 b/model/model/layers/22/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..3d733b798ec7ebd227f8128408379e7b44ad3866 --- /dev/null +++ b/model/model/layers/22/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24c5de1536ef926bac8b553fa5c381c449783d87328ab6aa829ada338067cd94 +size 1236139 diff --git a/model/model/layers/22/self_attn/o_proj/kernel/.zarray b/model/model/layers/22/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/22/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/22/self_attn/o_proj/kernel/0.0 b/model/model/layers/22/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..eeac718d9d3ceedc0791ac758dc4d9ce149f7860 --- /dev/null +++ b/model/model/layers/22/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfd36ebe957c677b5383610777618183df15d95b40d0c8114ed38a79fedbe8b7 +size 3671805 diff --git 
a/model/model/layers/22/self_attn/o_proj/kernel/0.1 b/model/model/layers/22/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..013bde36bbb8da39c470790008ee09aea1342fb0 --- /dev/null +++ b/model/model/layers/22/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:422bbaf1840c08c5c0693b496ec32f82e1d1e4b2634478a0333d3d614ca91d9e +size 3671327 diff --git a/model/model/layers/22/self_attn/o_proj/kernel/0.2 b/model/model/layers/22/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..5fd1a2b66dfa9852f0bc29b4da4e343ebd39d762 --- /dev/null +++ b/model/model/layers/22/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5eacba49bee5ba6214ebb0d4e8fbc7803c788ae69d70cbd07030c6c9f2a6cb3 +size 3672699 diff --git a/model/model/layers/22/self_attn/o_proj/kernel/0.3 b/model/model/layers/22/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..7d4622e197d352ebd6be1a3dc47810ae460bb050 --- /dev/null +++ b/model/model/layers/22/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ce40045098dc0d89f77cfbf2007b057f4a5a5254d80f49f79dfb6a9f3d9d909 +size 3671311 diff --git a/model/model/layers/22/self_attn/q_proj/kernel/.zarray b/model/model/layers/22/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/22/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/22/self_attn/q_proj/kernel/0.0 b/model/model/layers/22/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..d42c52cb17fcc0ca8ee9ee4b2175d0fba4a0e423 --- /dev/null +++ b/model/model/layers/22/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a33bee66602533434854af86ade0b2a7e00041c719e513144b56cb55ca53ba1 +size 3694498 diff --git a/model/model/layers/22/self_attn/q_proj/kernel/1.0 b/model/model/layers/22/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..1a50f7491b8ecf392bd6e78bacadfbbab7aad63e --- /dev/null +++ b/model/model/layers/22/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61628b7ea5b4fcb7ae57c0ef498430339cdff6a320e2e0720d4e381147eeeaec +size 3694890 diff --git a/model/model/layers/22/self_attn/q_proj/kernel/2.0 b/model/model/layers/22/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..e51fbe17c2555a61cd9b256513242d1df03c2736 --- /dev/null +++ b/model/model/layers/22/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c672bff319fe30e0fa5292b837bfafce8ba75af28b5e6bb540bbf9b54c2eff87 +size 3694343 diff --git a/model/model/layers/22/self_attn/q_proj/kernel/3.0 b/model/model/layers/22/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..18ef45da84deac478b0ccc5a857a9ec83799f6b4 --- /dev/null +++ b/model/model/layers/22/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94fd1a8d2ad3d3891b3de53a6a8a576ab650c5c0a5449aa84db6eac46d11945c +size 3694749 diff --git a/model/model/layers/22/self_attn/v_proj/kernel/.zarray b/model/model/layers/22/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/22/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/22/self_attn/v_proj/kernel/0.0 b/model/model/layers/22/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..9403c1324f5879108da8555aa75da0cb93ace3d6 --- /dev/null +++ b/model/model/layers/22/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:844220d129b003e6320ba1a454e6524e4760df22fd35000a7ced1ca58199e18e +size 1226618 diff --git a/model/model/layers/22/self_attn/v_proj/kernel/1.0 b/model/model/layers/22/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..b512b73264d77c1983252315e29a0830415daa67 --- /dev/null +++ b/model/model/layers/22/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45688370dfc61d1de7299b8fab478a7283309ec8708cca922290a6998d339690 +size 1226877 diff --git a/model/model/layers/22/self_attn/v_proj/kernel/2.0 b/model/model/layers/22/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..94afa92503310270e420605c4ab1429dba58d5c9 --- /dev/null +++ b/model/model/layers/22/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fd8eb3e46ff2bde163e8ddc39e25722c27e64e5f477bf9e3c258b3a7094fe3c +size 1226726 diff --git a/model/model/layers/22/self_attn/v_proj/kernel/3.0 b/model/model/layers/22/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..7203c7e6891a64dea0cdb1bf28773859f5570b2f --- /dev/null +++ b/model/model/layers/22/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4501cfcc143e55947d46f1bf8a96e95a7433dac238342fc66ccb60c873a847ee +size 1226045 
diff --git a/model/model/layers/23/input_layernorm/kernel/.zarray b/model/model/layers/23/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/23/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/23/input_layernorm/kernel/0 b/model/model/layers/23/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..569da79fc1ecd0cc39adfe48d61ec453e01138bb Binary files /dev/null and b/model/model/layers/23/input_layernorm/kernel/0 differ diff --git a/model/model/layers/23/mlp/down_proj/kernel/.zarray b/model/model/layers/23/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/23/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/23/mlp/down_proj/kernel/0.0 b/model/model/layers/23/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f4e6dad0d8947305568c79e4750d7dbc829c36c3 --- /dev/null +++ b/model/model/layers/23/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7eacedaa9d869aefb88858a67064b90cc6e09968785c28fe4a6bc324fea6436 +size 9801116 diff --git a/model/model/layers/23/mlp/down_proj/kernel/0.1 b/model/model/layers/23/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..706829ed889805ecad916cbb89dab065d602c9e6 --- /dev/null +++ b/model/model/layers/23/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c87635cebef73a8b6a53e4722bcb1ed77816f0ad0f192aa724d0c5ebd679f158 +size 9803249 diff --git a/model/model/layers/23/mlp/down_proj/kernel/0.2 b/model/model/layers/23/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..ebc88f7c0b71d06066fc59aaf21b2aa03f10e776 --- /dev/null +++ b/model/model/layers/23/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8108773d09665b0b502b80317811db078e1968c4b34de14ccb3693f8691e811 +size 9803131 diff --git a/model/model/layers/23/mlp/down_proj/kernel/0.3 b/model/model/layers/23/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..61c403bc41934c033b6f14533d5cbc53870f016d --- /dev/null +++ b/model/model/layers/23/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:702cd6a4a26d921d9f86cfd0af5b1577bc526ba29e28dd45be4763bf32633f97 +size 9801321 diff --git a/model/model/layers/23/mlp/gate_proj/kernel/.zarray b/model/model/layers/23/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/23/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/23/mlp/gate_proj/kernel/0.0 b/model/model/layers/23/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..6190efdb2661db80a0541a77696200155d2aedb6 --- /dev/null +++ b/model/model/layers/23/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d21f610374ca5c464d9c85e3e3d8966013e1e90f5f021da4718ac43eddb64f78 +size 9817041 diff --git a/model/model/layers/23/mlp/gate_proj/kernel/1.0 b/model/model/layers/23/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..33a7285cc338a552552d7f340d414a98225f0cb6 --- /dev/null +++ b/model/model/layers/23/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf44e71b4b325ad40ea7751d946278885d97fd981d3401dfddc4b05f08a0582c +size 9817247 diff --git a/model/model/layers/23/mlp/gate_proj/kernel/2.0 b/model/model/layers/23/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..630c7e924b9fd953dd43fff30ae0c39f58d27124 --- /dev/null +++ b/model/model/layers/23/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78e32b861f0e31e4165813401884f2d5d205da4d99d738f5bb60836d970432af +size 9816447 diff --git a/model/model/layers/23/mlp/gate_proj/kernel/3.0 b/model/model/layers/23/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..b7168ff4952364bbdc2430d2306c8ebee648f33c --- /dev/null +++ b/model/model/layers/23/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8f09ebffe411a6f5ebe4b7ee74c9b01604407a35f9e8e0988ff88cbe06334e9 +size 9815796 diff --git a/model/model/layers/23/mlp/up_proj/kernel/.zarray b/model/model/layers/23/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/23/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/23/mlp/up_proj/kernel/0.0 b/model/model/layers/23/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..6676a014292613cfd14c66038ee59478cc6f85e9 --- /dev/null +++ b/model/model/layers/23/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cf0ea9b89a77795a74dba61ac3e75840f3a3332267b72fd0b5045384df1f1cf +size 9791778 diff --git a/model/model/layers/23/mlp/up_proj/kernel/1.0 b/model/model/layers/23/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..279bd5e463e73f3c3f97971ef76d684dc1f281ee --- /dev/null +++ b/model/model/layers/23/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17b3ef6a02f3ce372cf30306f67f7c24b2d2c1b130e073e8432fb52b74ee3a8c +size 9792761 diff --git a/model/model/layers/23/mlp/up_proj/kernel/2.0 b/model/model/layers/23/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..f2b80524da0a5716d34ff4bb7f210ea7d871449d --- /dev/null +++ b/model/model/layers/23/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a93ef6ea8ed07493c62ba76b676c69ecb064f77d6bf93a8af76768f1a5f7a9a +size 9792360 diff --git a/model/model/layers/23/mlp/up_proj/kernel/3.0 b/model/model/layers/23/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..e5e422065f695adac5bbd3f104f22d8ed363caa2 --- /dev/null +++ b/model/model/layers/23/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1582df303050e68757289415d78da0dc09bebf909ab388d00fd99afe14f20587 +size 9792055 diff --git a/model/model/layers/23/post_attention_layernorm/kernel/.zarray b/model/model/layers/23/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ 
b/model/model/layers/23/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/23/post_attention_layernorm/kernel/0 b/model/model/layers/23/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..f9e5cab29d6da054adf5096396e53e7e659aeaa8 Binary files /dev/null and b/model/model/layers/23/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/23/self_attn/k_proj/kernel/.zarray b/model/model/layers/23/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/23/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/23/self_attn/k_proj/kernel/0.0 b/model/model/layers/23/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..7ef7a09076ea02e36a737d0ca7d13ec3956ec84a --- /dev/null +++ b/model/model/layers/23/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4827f9b7576ffa13e1c9749b7533c1e3353c411fc2502374161c44f3681ad383 +size 1234467 diff --git a/model/model/layers/23/self_attn/k_proj/kernel/1.0 b/model/model/layers/23/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..a6532a699721d4bde9efdcf0de758c922516b6bd --- /dev/null +++ b/model/model/layers/23/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:9b500883279bae5b1a64bc5a384f1fb25635090cfb313a01379b409eb31c54ec +size 1234556 diff --git a/model/model/layers/23/self_attn/k_proj/kernel/2.0 b/model/model/layers/23/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..3d1e548741c55622b4b4904de5ea77157e8504f5 --- /dev/null +++ b/model/model/layers/23/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e96cfa4b9c71e70152acf1aac5fc45aad6c3144567e611b804d9885e3a3a1f5 +size 1234443 diff --git a/model/model/layers/23/self_attn/k_proj/kernel/3.0 b/model/model/layers/23/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6f7f7085f54e44163a6442d462b99b3c51ac5a3c --- /dev/null +++ b/model/model/layers/23/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97e433a5dea52282280e92c7aa1945fdf4b0a2e08ec8e4c5cc259ef51249549f +size 1234227 diff --git a/model/model/layers/23/self_attn/o_proj/kernel/.zarray b/model/model/layers/23/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/23/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/23/self_attn/o_proj/kernel/0.0 b/model/model/layers/23/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..630905347f3ada054d7fcab4fcef781a770a9087 --- /dev/null +++ b/model/model/layers/23/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db4d2c18a5d1c8ef3f7733aa9e03e89c6dbd65363a5db5197b84a306a22a2fa6 +size 3672541 diff --git 
a/model/model/layers/23/self_attn/o_proj/kernel/0.1 b/model/model/layers/23/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..1a756303a22b0b6f76ce14d0457c88a69535fa17 --- /dev/null +++ b/model/model/layers/23/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87c970ad0ffa8b64259351e58443c37aae17a629d84ee091d13494023db6dae6 +size 3672351 diff --git a/model/model/layers/23/self_attn/o_proj/kernel/0.2 b/model/model/layers/23/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..b72c6b044f88efa20aea293ac911c7abe4b65a78 --- /dev/null +++ b/model/model/layers/23/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f255a90117935f0918dad39d6cb08469b645b3c6081d141b55cea27e5b00600c +size 3672894 diff --git a/model/model/layers/23/self_attn/o_proj/kernel/0.3 b/model/model/layers/23/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..e8e4bb2d98edf873ac4e905ffde288c946a6b18d --- /dev/null +++ b/model/model/layers/23/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd3564ab802a006591b4c234c703744bc7177ab0f42ef7b745f4ea8b3db84b1e +size 3671811 diff --git a/model/model/layers/23/self_attn/q_proj/kernel/.zarray b/model/model/layers/23/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/23/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/23/self_attn/q_proj/kernel/0.0 b/model/model/layers/23/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..587d86ff3f90e7d49768bbea05082c5fd78d73df --- /dev/null +++ b/model/model/layers/23/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:487d9b2e8979b91afbff7f0a0d7583d9bbb8083e3ab39e85c743a80370e4d33b +size 3696405 diff --git a/model/model/layers/23/self_attn/q_proj/kernel/1.0 b/model/model/layers/23/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..b55acc4dd6a5fcce194f4a5fa11d48032a5ef311 --- /dev/null +++ b/model/model/layers/23/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf23f32e5a469a47b44e8e9ed2bf5b513be9cd5391db09cfd7fe1995cb7f4cd5 +size 3696394 diff --git a/model/model/layers/23/self_attn/q_proj/kernel/2.0 b/model/model/layers/23/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..d581339fe0e3c3fd135b40355fb4afabb5dc8d4e --- /dev/null +++ b/model/model/layers/23/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20cc28ed955e0f7d90e9b7311f2d5dc42935fc67a1e5f6b35889e87147ea591e +size 3695997 diff --git a/model/model/layers/23/self_attn/q_proj/kernel/3.0 b/model/model/layers/23/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..dd4e8e4f3bbb137b86397df1a2fc224dc707ec13 --- /dev/null +++ b/model/model/layers/23/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5dfb88ad2d9108dbdb376c7b727646c533e2e0c00b98e0ea2041ba5ee0e7d0d +size 3695982 diff --git a/model/model/layers/23/self_attn/v_proj/kernel/.zarray b/model/model/layers/23/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/23/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/23/self_attn/v_proj/kernel/0.0 b/model/model/layers/23/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f2af3c1bfffd86c1e2b00d2b1f73aa5fca825b68 --- /dev/null +++ b/model/model/layers/23/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ae437304b115cddedd6656cc4851aa2185b3ce8cf052d61d3012db2bf06031c +size 1228178 diff --git a/model/model/layers/23/self_attn/v_proj/kernel/1.0 b/model/model/layers/23/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..42eceaab930fe602beff997c999cb90391172669 --- /dev/null +++ b/model/model/layers/23/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38af86d35140203c8b80a2401fa28e0f6121adc483f4589f86ec0234746b6b62 +size 1228474 diff --git a/model/model/layers/23/self_attn/v_proj/kernel/2.0 b/model/model/layers/23/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..57d341b664c399fe133221623608d21941278425 --- /dev/null +++ b/model/model/layers/23/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13421c92ce48bc8cc1f1cc0d5fe6b10fbbea8085b9e515412c05cd70a611f2a8 +size 1228394 diff --git a/model/model/layers/23/self_attn/v_proj/kernel/3.0 b/model/model/layers/23/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..9e1d46dc73c9bab5901c5d9b2e4aaa80f6e4f801 --- /dev/null +++ b/model/model/layers/23/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:325740c9feb00054b17cc9b34bd7c67048f6899c105047ab6bf0921844d802fe +size 1227598 
diff --git a/model/model/layers/24/input_layernorm/kernel/.zarray b/model/model/layers/24/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/24/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/24/input_layernorm/kernel/0 b/model/model/layers/24/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..1fe1fb8c57060a46b7ff7b1bef0e5d768938bca4 Binary files /dev/null and b/model/model/layers/24/input_layernorm/kernel/0 differ diff --git a/model/model/layers/24/mlp/down_proj/kernel/.zarray b/model/model/layers/24/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/24/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/24/mlp/down_proj/kernel/0.0 b/model/model/layers/24/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e12a5d390c836b3e876506bb34f49e3dfe03c99c --- /dev/null +++ b/model/model/layers/24/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0848e2046670c6ac8fbf7978c39677b1e171a71ee830d324bc93da9bf617c16 +size 9803869 diff --git a/model/model/layers/24/mlp/down_proj/kernel/0.1 b/model/model/layers/24/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..8cc04ba5b3babfbe498a707c2c923c3ecc14ec36 --- /dev/null +++ b/model/model/layers/24/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa96b47628c74eac2fe42220f986ee6e11bdb04f9157a1625d48eb9973ebe287 +size 9804570 diff --git a/model/model/layers/24/mlp/down_proj/kernel/0.2 b/model/model/layers/24/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..800ed7f5196611cc8ec95b8e3c8ed9f05a40b39d --- /dev/null +++ b/model/model/layers/24/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:510eecdedb3a7caa6eb56f30582de0358c1dd32b3e71ca2b5dc051fd09c3bde0 +size 9803825 diff --git a/model/model/layers/24/mlp/down_proj/kernel/0.3 b/model/model/layers/24/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..0c202ace327791a210ce8749931b520908537dc7 --- /dev/null +++ b/model/model/layers/24/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f505fc9da8421d9e7ad1065c1308dc1d10182e5e75aca009269e6222999345ef +size 9802360 diff --git a/model/model/layers/24/mlp/gate_proj/kernel/.zarray b/model/model/layers/24/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/24/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/24/mlp/gate_proj/kernel/0.0 b/model/model/layers/24/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c63019ee9dff1df2e26f6f2f6837e8d614601f04 --- /dev/null +++ b/model/model/layers/24/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4990abb283d88229c3b3286fe365f5029e303e295c853a0cdbc0f3db4aca2a7e +size 9820559 diff --git a/model/model/layers/24/mlp/gate_proj/kernel/1.0 b/model/model/layers/24/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..84b17e5bd98efcfe34a4262f8d2979c609f7bab6 --- /dev/null +++ b/model/model/layers/24/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:825c158bb6948a4aea3514938b772fe156acf18e7f19c46f0e0a558696f34937 +size 9820695 diff --git a/model/model/layers/24/mlp/gate_proj/kernel/2.0 b/model/model/layers/24/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..8b6631e03e3c6fbddfe2b3b17f73a50cf25907d6 --- /dev/null +++ b/model/model/layers/24/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff320ebce8461b0bf996fd1797d9f5804c77a6e2861a23bad03efaf083f6d402 +size 9821669 diff --git a/model/model/layers/24/mlp/gate_proj/kernel/3.0 b/model/model/layers/24/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..27f930dfbe374b4376d8108e47ad4ace79aea9e5 --- /dev/null +++ b/model/model/layers/24/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5cefc526b0545912df1e9ae7a90bfafc400e65e99fe180881bfde33be7fc23c +size 9820802 diff --git a/model/model/layers/24/mlp/up_proj/kernel/.zarray b/model/model/layers/24/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/24/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/24/mlp/up_proj/kernel/0.0 b/model/model/layers/24/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e8cdf2186815cf1c540b7b7aeaf8d77e9737d3ef --- /dev/null +++ b/model/model/layers/24/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edc39d37da445dc92e4298d351a7edfc2384ceb37c6e28271519b6d2533b02d5 +size 9792805 diff --git a/model/model/layers/24/mlp/up_proj/kernel/1.0 b/model/model/layers/24/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..509782c93188cf9106179dabbba459a60cec46fc --- /dev/null +++ b/model/model/layers/24/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bd89bfdbf0a75bb8edd8ade4bccdd26fed78fd47bcf9d56ffdbde6b10535a4f +size 9792210 diff --git a/model/model/layers/24/mlp/up_proj/kernel/2.0 b/model/model/layers/24/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..686251419c911396f0f89fdce8b34a8f187f2f81 --- /dev/null +++ b/model/model/layers/24/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f418dc03cf135803d35d004ec5d9ba8d18e85ca1e701db63f48069ffe2173ed +size 9793016 diff --git a/model/model/layers/24/mlp/up_proj/kernel/3.0 b/model/model/layers/24/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..f0875d7451bac2e29ca037677911e8258ad0a361 --- /dev/null +++ b/model/model/layers/24/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:323d4f7c65b7d070262e1c512341d8c31dc7674870a94a18aabf8efefd7b5ebf +size 9792070 diff --git a/model/model/layers/24/post_attention_layernorm/kernel/.zarray b/model/model/layers/24/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ 
b/model/model/layers/24/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/24/post_attention_layernorm/kernel/0 b/model/model/layers/24/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..ada14cf2325509b1669ffaad876e98a71dc1bce0 Binary files /dev/null and b/model/model/layers/24/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/24/self_attn/k_proj/kernel/.zarray b/model/model/layers/24/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/24/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/24/self_attn/k_proj/kernel/0.0 b/model/model/layers/24/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e31885ad72443564315f73fa8023a6cdf1381b31 --- /dev/null +++ b/model/model/layers/24/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e204b74cda37222cee6ef00006b4bed6a14e707bb014154bbb495aad6999550d +size 1235355 diff --git a/model/model/layers/24/self_attn/k_proj/kernel/1.0 b/model/model/layers/24/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..c8fb8a1b12ae8fa4735e826f6b2a7aa6c5afaaf9 --- /dev/null +++ b/model/model/layers/24/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:29cf59c69f9230ac566c9468ceae006d655bcc3df27ab21e949fb8f3862c4364 +size 1235612 diff --git a/model/model/layers/24/self_attn/k_proj/kernel/2.0 b/model/model/layers/24/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..8bbda9340a3d51a713c2fea21a4d53ccd246ac8c --- /dev/null +++ b/model/model/layers/24/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3816df01b28b8ef88aa5291ccde0722c0a0f8df72570a53e1d201f1d6daa766 +size 1235486 diff --git a/model/model/layers/24/self_attn/k_proj/kernel/3.0 b/model/model/layers/24/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..f4e6a801c36455ea55d46fa6e8257ac06bdda349 --- /dev/null +++ b/model/model/layers/24/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44164268f6296429b2245e56162f38a6e30078167012de30f11e791e971a1336 +size 1235324 diff --git a/model/model/layers/24/self_attn/o_proj/kernel/.zarray b/model/model/layers/24/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/24/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/24/self_attn/o_proj/kernel/0.0 b/model/model/layers/24/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..fe61fafbc904148bdad58d777c3fdd1ac929e7ee --- /dev/null +++ b/model/model/layers/24/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e5a1aed8f7df13b149ac9d3c60be2a13c7c863398fde18c66d5897aa7c38b51 +size 3672732 diff --git 
a/model/model/layers/24/self_attn/o_proj/kernel/0.1 b/model/model/layers/24/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..92976be7b6163a8c29c5a6d5c72434545cf9a1ce --- /dev/null +++ b/model/model/layers/24/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:342714788c5e5b7fc19fca9ffa19f5b25df255713aaa1fc1405097391f374780 +size 3673031 diff --git a/model/model/layers/24/self_attn/o_proj/kernel/0.2 b/model/model/layers/24/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..5d4b0a544c2a08fe2f5fe43b67a528f29065a236 --- /dev/null +++ b/model/model/layers/24/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09b4e56075e3b3a652a515644a3e07e0a5d1906495cfca85cfc68befb3762e27 +size 3673453 diff --git a/model/model/layers/24/self_attn/o_proj/kernel/0.3 b/model/model/layers/24/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..194053f3738eff2efd26eef1af090357f21ad3ac --- /dev/null +++ b/model/model/layers/24/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e91aec1735bcbb0604838e6bd5c7ff9350ca5f89b462f8ad28232a15f0924c1a +size 3672715 diff --git a/model/model/layers/24/self_attn/q_proj/kernel/.zarray b/model/model/layers/24/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/24/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/24/self_attn/q_proj/kernel/0.0 b/model/model/layers/24/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..d0a0d3982d8b4de16c917b3beb67b57e77070a80 --- /dev/null +++ b/model/model/layers/24/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9ec83ed97553725138d0d4bc152625ee6e8c88be6622f6b7a7574e53a49a6be +size 3694399 diff --git a/model/model/layers/24/self_attn/q_proj/kernel/1.0 b/model/model/layers/24/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..c69137008fe15d831ea9c5064033f9f8ad80e6fa --- /dev/null +++ b/model/model/layers/24/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:464b0ed7e3114d16d88b7b43faf1968a598b7ae6d4a7703ba45aeb2939910e96 +size 3696997 diff --git a/model/model/layers/24/self_attn/q_proj/kernel/2.0 b/model/model/layers/24/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..66ac79cb04e3161769de8b923bf82455d43f8676 --- /dev/null +++ b/model/model/layers/24/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:799f54b9857a18c9e94e366aaa5085f63b85dc8ca43a9ad1b173fadb9a22b022 +size 3694995 diff --git a/model/model/layers/24/self_attn/q_proj/kernel/3.0 b/model/model/layers/24/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..8cfc9b7e35dc1dc1c251dd1844883007f38301ca --- /dev/null +++ b/model/model/layers/24/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3f137f1f04444d3b267cca2b48fb260238beb1977ae9bd14c05dc8683c34829 +size 3694956 diff --git a/model/model/layers/24/self_attn/v_proj/kernel/.zarray b/model/model/layers/24/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/24/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/24/self_attn/v_proj/kernel/0.0 b/model/model/layers/24/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..9a759338d5c1683afe4215418d753d5a312259ff --- /dev/null +++ b/model/model/layers/24/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ddd79185ed22b35526c17f5dfe97ee7d04aab30531ab463e899c332a558ab4b +size 1228511 diff --git a/model/model/layers/24/self_attn/v_proj/kernel/1.0 b/model/model/layers/24/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..2def75d17be44da2ebc28b16bf0392e7f8f1e4ee --- /dev/null +++ b/model/model/layers/24/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:848c0518d9a95eec791ac49df14ce1bc90e3bc06e5b21433c6c6eca9113c73da +size 1228758 diff --git a/model/model/layers/24/self_attn/v_proj/kernel/2.0 b/model/model/layers/24/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..fe1aa2bb5419ce140a728187198189951b436f3b --- /dev/null +++ b/model/model/layers/24/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad83b21c99fa61cb0ab912d6906a2a0a318006f3c1aa9ac6182d74f92b4ab690 +size 1228039 diff --git a/model/model/layers/24/self_attn/v_proj/kernel/3.0 b/model/model/layers/24/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..5243b59cc1a4312085c8b825040ec1b3c1f614e2 --- /dev/null +++ b/model/model/layers/24/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69b776173502bbd764a59a493984e359591607db95668135f73374aac24c73ab +size 1227902 
diff --git a/model/model/layers/25/input_layernorm/kernel/.zarray b/model/model/layers/25/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/25/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/25/input_layernorm/kernel/0 b/model/model/layers/25/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..a67083a9d0f945c9d568811bac0a303f4f329905 Binary files /dev/null and b/model/model/layers/25/input_layernorm/kernel/0 differ diff --git a/model/model/layers/25/mlp/down_proj/kernel/.zarray b/model/model/layers/25/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/25/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/25/mlp/down_proj/kernel/0.0 b/model/model/layers/25/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..b532a3d178e22e83ff1fddb049e57bd10d87b0b7 --- /dev/null +++ b/model/model/layers/25/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31f774f7e8ee193705145e03cadfde1fda7521f2a48b4555ba0e109d0c6809fd +size 9807932 diff --git a/model/model/layers/25/mlp/down_proj/kernel/0.1 b/model/model/layers/25/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..ad1775f8bec505606f637884b4539ce05de5b42d --- /dev/null +++ b/model/model/layers/25/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65f95248b05a78cba900ef5b22eb6c108bb70fb3877173cda68bca723209c152 +size 9808623 diff --git a/model/model/layers/25/mlp/down_proj/kernel/0.2 b/model/model/layers/25/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..7f45450b97caf7fdb48a00f63ac24b1c5d8ce9fc --- /dev/null +++ b/model/model/layers/25/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:153821134bfca75fb0e39913e4f9b5d6caabf15a1dee8d05b0f23ea8cfcc2de2 +size 9809427 diff --git a/model/model/layers/25/mlp/down_proj/kernel/0.3 b/model/model/layers/25/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..2f0d6349a30f7b3d43d478fb4d1b27465b2a4e2f --- /dev/null +++ b/model/model/layers/25/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5ac115a2de571e12c933e955793b65ac4c3f3d318a5a398228d8e0f252993cd +size 9807728 diff --git a/model/model/layers/25/mlp/gate_proj/kernel/.zarray b/model/model/layers/25/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/25/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/25/mlp/gate_proj/kernel/0.0 b/model/model/layers/25/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..0c73d885051f5aea0a63d5a36325b27b3cb1930f --- /dev/null +++ b/model/model/layers/25/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:855e417ced1a19f3ad52dbfaad62923454db95bc84f1c05ad7626295255ea1d1 +size 9824343 diff --git a/model/model/layers/25/mlp/gate_proj/kernel/1.0 b/model/model/layers/25/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..86eaa54e7f9b5f55fe7b02fda89b90edb3b9e2dd --- /dev/null +++ b/model/model/layers/25/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4e193166f419f84f3f103ecb375b82e187ae19b296a0f0e832aaee86109c0b1 +size 9823703 diff --git a/model/model/layers/25/mlp/gate_proj/kernel/2.0 b/model/model/layers/25/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..f51ec9d3d8089552ea7cf3ba02dcd548d61e4894 --- /dev/null +++ b/model/model/layers/25/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37f184607deb9c655d7be0cb7a5271e145e96afc872ee2a04ae3cc7ef5d925d7 +size 9823834 diff --git a/model/model/layers/25/mlp/gate_proj/kernel/3.0 b/model/model/layers/25/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..78df2e4c951e73870d07b951d823611e943261cb --- /dev/null +++ b/model/model/layers/25/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89165a40f471d88c224994f89b5dc233f391d34b00bd32f098617efa6f30a5e3 +size 9824053 diff --git a/model/model/layers/25/mlp/up_proj/kernel/.zarray b/model/model/layers/25/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/25/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/25/mlp/up_proj/kernel/0.0 b/model/model/layers/25/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..2807313809156fc009dd09bb99d7fff02b4ab31f --- /dev/null +++ b/model/model/layers/25/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36e8a357e437f0bf33cf6f4319629e5ae158178cade34d160c699411f624675d +size 9793073 diff --git a/model/model/layers/25/mlp/up_proj/kernel/1.0 b/model/model/layers/25/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..0600634c97a985c9bc2f3556a0c0c87f6fda59cf --- /dev/null +++ b/model/model/layers/25/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60dd19839e14555d2263373c888fe56b0c4c2aeb15cf5923b73e5078116a7c69 +size 9793377 diff --git a/model/model/layers/25/mlp/up_proj/kernel/2.0 b/model/model/layers/25/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..e61179245e884678bd99817afb518082cfe11235 --- /dev/null +++ b/model/model/layers/25/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2136d08a4d3a54a30f1f8e92c3823a4d7147ea18181cd8537a4e7ef5e45909a6 +size 9793542 diff --git a/model/model/layers/25/mlp/up_proj/kernel/3.0 b/model/model/layers/25/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..ca85dc40db3c5d73afa4a506e6206516a70dde57 --- /dev/null +++ b/model/model/layers/25/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5f45082f6836384ee293c5ba5376a6f4332c40aff04afa6028f51e0740c569e +size 9793378 diff --git a/model/model/layers/25/post_attention_layernorm/kernel/.zarray b/model/model/layers/25/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ 
b/model/model/layers/25/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/25/post_attention_layernorm/kernel/0 b/model/model/layers/25/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..4fd81526f80040b5229ea316ac0443826093cf1b Binary files /dev/null and b/model/model/layers/25/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/25/self_attn/k_proj/kernel/.zarray b/model/model/layers/25/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/25/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/25/self_attn/k_proj/kernel/0.0 b/model/model/layers/25/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..abf8e0e1e553119678b491920fdfbfe0f6df4d69 --- /dev/null +++ b/model/model/layers/25/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d907c9d67c2003224cba1c7db950ed7367cb571a38d9713f25368c3e88d628e8 +size 1232644 diff --git a/model/model/layers/25/self_attn/k_proj/kernel/1.0 b/model/model/layers/25/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..2fb59e8d12761aa7f8023ad0dd25500c70db333d --- /dev/null +++ b/model/model/layers/25/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:8fd52a27893e0a21f5bd5a7e3f20f794306682f087a1bd78629da928305e0d97 +size 1233083 diff --git a/model/model/layers/25/self_attn/k_proj/kernel/2.0 b/model/model/layers/25/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..48e9b1b620520fa28e89ff7afda9da05506cc517 --- /dev/null +++ b/model/model/layers/25/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29aebfce188a1554261f847cc82abcdbb24462a8266e1c042a48c9e99d000f86 +size 1233179 diff --git a/model/model/layers/25/self_attn/k_proj/kernel/3.0 b/model/model/layers/25/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6b516ff59a41611acfc54d735368ad9cfa492aaf --- /dev/null +++ b/model/model/layers/25/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a4bb7cb58b1d0a8aa4739dfa1eefc02e9950fa7afa57489489b15d81358ed01 +size 1232813 diff --git a/model/model/layers/25/self_attn/o_proj/kernel/.zarray b/model/model/layers/25/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/25/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/25/self_attn/o_proj/kernel/0.0 b/model/model/layers/25/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..01a73d9f7c074823541491f6db462ca4ca66de79 --- /dev/null +++ b/model/model/layers/25/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55b828964ef62b9ee8cf460c4c3328030eaf5429fb1085e6fa7c587fbf90e379 +size 3674706 diff --git 
a/model/model/layers/25/self_attn/o_proj/kernel/0.1 b/model/model/layers/25/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..1c88f85a86ae9c045136b48261f90b315a9ed6ea --- /dev/null +++ b/model/model/layers/25/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04d146ff6275f3ac423a5098e71560df45097639211e44d19b8bace90ac9a3a9 +size 3674847 diff --git a/model/model/layers/25/self_attn/o_proj/kernel/0.2 b/model/model/layers/25/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..f7738c45dc2b4f7649db1bf8bc9df8fae92d1ad6 --- /dev/null +++ b/model/model/layers/25/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49058e29b6c3154d6e758358d7437cf41e7801558ea5c0332015db3ce6b7f2a3 +size 3675768 diff --git a/model/model/layers/25/self_attn/o_proj/kernel/0.3 b/model/model/layers/25/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..2acc7e1d735b99b28900b52f6a92e57bdb999ab5 --- /dev/null +++ b/model/model/layers/25/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bef72efac1aff07f92490fd4af15b2a7175e1fd9c6a771a987de1abd9dec3070 +size 3674628 diff --git a/model/model/layers/25/self_attn/q_proj/kernel/.zarray b/model/model/layers/25/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/25/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/25/self_attn/q_proj/kernel/0.0 b/model/model/layers/25/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..8e1c58350297916fede5ccc7c97bd4a927b07403 --- /dev/null +++ b/model/model/layers/25/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20964dba973cb6344f5ee897b5e0afae8791f09455b2470ff802930849d40f46 +size 3690859 diff --git a/model/model/layers/25/self_attn/q_proj/kernel/1.0 b/model/model/layers/25/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..ee3f12be8b75577172539ec9215f99af48f23d59 --- /dev/null +++ b/model/model/layers/25/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e73d4b05dc970a4124554b811798cb33c3aeab4e2deced9f3fa6a6be4779e233 +size 3691338 diff --git a/model/model/layers/25/self_attn/q_proj/kernel/2.0 b/model/model/layers/25/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..18122de549fb62faaca71931a31f288f477308fa --- /dev/null +++ b/model/model/layers/25/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb8356977f97d9ee9667e38dc428460e1dda19849b5b8279327af6e486afd352 +size 3690961 diff --git a/model/model/layers/25/self_attn/q_proj/kernel/3.0 b/model/model/layers/25/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..b4e64f9e60d3207da3241e87faa2fe48840db73f --- /dev/null +++ b/model/model/layers/25/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:105e8943b464db5d412fa1dca5f70df76e37f09db3986b502be0e9d669823e47 +size 3690327 diff --git a/model/model/layers/25/self_attn/v_proj/kernel/.zarray b/model/model/layers/25/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/25/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/25/self_attn/v_proj/kernel/0.0 b/model/model/layers/25/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..4041a7778883d19d69b74b8b3ac90fcd7b8e0d71 --- /dev/null +++ b/model/model/layers/25/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8de77071cf8b7204b72e55c2cc890d7414c383f50f72c1cfd53b2d45c3edd99 +size 1228989 diff --git a/model/model/layers/25/self_attn/v_proj/kernel/1.0 b/model/model/layers/25/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..3df885f4b85717dff6bcae65da3a57b0123cba04 --- /dev/null +++ b/model/model/layers/25/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7326dec966ab9e225f0d982b04677b1eddeed301ec932502499ef6ceded03248 +size 1229407 diff --git a/model/model/layers/25/self_attn/v_proj/kernel/2.0 b/model/model/layers/25/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..398cbe8cd2ce0c0f1075c101509576066c4943db --- /dev/null +++ b/model/model/layers/25/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b401b0b49175abe1faefb048df1888333bcda580a27ec10986a66961e0877eec +size 1229012 diff --git a/model/model/layers/25/self_attn/v_proj/kernel/3.0 b/model/model/layers/25/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..5a25dd3feb89631b4c01b4f66be344b3afd58452 --- /dev/null +++ b/model/model/layers/25/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:927b31fd6f20ff5d9470a31e69f27bd6c790426718b700694161669a2ff842c8 +size 1228753 
diff --git a/model/model/layers/26/input_layernorm/kernel/.zarray b/model/model/layers/26/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/26/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/26/input_layernorm/kernel/0 b/model/model/layers/26/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..0694ef487d2bc34a4dd9506a0fde9867e8d19a2a Binary files /dev/null and b/model/model/layers/26/input_layernorm/kernel/0 differ diff --git a/model/model/layers/26/mlp/down_proj/kernel/.zarray b/model/model/layers/26/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/26/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/26/mlp/down_proj/kernel/0.0 b/model/model/layers/26/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f81dbadb14d825d6c68dbcaf9a38aa56e4dc8b88 --- /dev/null +++ b/model/model/layers/26/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acc134eaff28bbd3eee6f8794e3ff7d360abab0ad4390645d1dba827d434f991 +size 9812022 diff --git a/model/model/layers/26/mlp/down_proj/kernel/0.1 b/model/model/layers/26/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..ecc7a183b8bdc6d8fd3e820af1f1a5943de1c085 --- /dev/null +++ b/model/model/layers/26/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6fc5495b93718e2f2eca0af72313f4b56f57fdd4902b421489c9346e00ffc0c +size 9813626 diff --git a/model/model/layers/26/mlp/down_proj/kernel/0.2 b/model/model/layers/26/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..4db258f180535ee99c863464b930d60b8b46d0eb --- /dev/null +++ b/model/model/layers/26/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c248370c58816d1697f8eabee816032913e2d494f980c651a031da4c7ee92f5f +size 9813979 diff --git a/model/model/layers/26/mlp/down_proj/kernel/0.3 b/model/model/layers/26/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..f45b1e0aad9712210cc1def45b314fae02c4a198 --- /dev/null +++ b/model/model/layers/26/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b02951f8094278f51d974cebd49ad0ed8dfbb62dee10ce82b77444ca0bf56038 +size 9811831 diff --git a/model/model/layers/26/mlp/gate_proj/kernel/.zarray b/model/model/layers/26/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/26/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/26/mlp/gate_proj/kernel/0.0 b/model/model/layers/26/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..22ae615186b49bbbfc06f645a15f33917ff1b793 --- /dev/null +++ b/model/model/layers/26/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf1face1ee42162fff7162b7cf5b3c741184344f6a8c939572d9239190f60e29 +size 9829521 diff --git a/model/model/layers/26/mlp/gate_proj/kernel/1.0 b/model/model/layers/26/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..29f5f7a6fc6e3e4aac7194c141f4e71a55a69cb7 --- /dev/null +++ b/model/model/layers/26/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dda4b20241cd64eac90205f5efa054c6f1ca1302b60e8a019d7e69f71e757a68 +size 9829239 diff --git a/model/model/layers/26/mlp/gate_proj/kernel/2.0 b/model/model/layers/26/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..ebb4b93249412dbce60b1a52a0c8cceaef4bcd00 --- /dev/null +++ b/model/model/layers/26/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4480cadb7b8686941b51b5dadb05dd62a65559fe0bdab610b0342b50b166aac2 +size 9829970 diff --git a/model/model/layers/26/mlp/gate_proj/kernel/3.0 b/model/model/layers/26/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..0c5a72a3bc5b97b94c5634dcf58e5e387e2e61cd --- /dev/null +++ b/model/model/layers/26/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:701805657c2108aa94dd8875f8fc0a93dea0795cab9ffc6c759dbf6f1affb65f +size 9830084 diff --git a/model/model/layers/26/mlp/up_proj/kernel/.zarray b/model/model/layers/26/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/26/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/26/mlp/up_proj/kernel/0.0 b/model/model/layers/26/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e4004f533636f8464ccd18e42b1c9f71c0197d99 --- /dev/null +++ b/model/model/layers/26/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecc1a4c91f8b18fbf1042ae3f5e3d241b15fe1caedf93a160a95b81693feca46 +size 9794873 diff --git a/model/model/layers/26/mlp/up_proj/kernel/1.0 b/model/model/layers/26/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..144c67fb0f7277efd4b62596c15af0d7a43229a9 --- /dev/null +++ b/model/model/layers/26/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e22f8185044cd4f3cf0cb9bb28739b13bc2aae8ac850e41ff4e3ca24398b20e8 +size 9795424 diff --git a/model/model/layers/26/mlp/up_proj/kernel/2.0 b/model/model/layers/26/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..a78ecf35fcdc6161a1fc4513fb431ff8e34be6f7 --- /dev/null +++ b/model/model/layers/26/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cd1b949b6609a71d536faccb1891c6efbf0f1e76c88b82a014f78fe4fec4eca +size 9795596 diff --git a/model/model/layers/26/mlp/up_proj/kernel/3.0 b/model/model/layers/26/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..ada7a27881a4cfaa4c3a36d742ac940bf0788d42 --- /dev/null +++ b/model/model/layers/26/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcf39c696b83bde7abb1b2f7a336d77684d70f1e1757a172ef10b27b3098c26f +size 9795598 diff --git a/model/model/layers/26/post_attention_layernorm/kernel/.zarray b/model/model/layers/26/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ 
b/model/model/layers/26/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/26/post_attention_layernorm/kernel/0 b/model/model/layers/26/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..281b4840267bc7276b348a69d2b977a757444d75 Binary files /dev/null and b/model/model/layers/26/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/26/self_attn/k_proj/kernel/.zarray b/model/model/layers/26/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/26/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/26/self_attn/k_proj/kernel/0.0 b/model/model/layers/26/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ba39186477a71bfb747417fe48bf958cc16bfc72 --- /dev/null +++ b/model/model/layers/26/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84abf6039015e39b29c84b9667bee72153aae6fdeecbc37f14a5a4bb6741a96c +size 1234824 diff --git a/model/model/layers/26/self_attn/k_proj/kernel/1.0 b/model/model/layers/26/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..33f5065660d350595b7d40c27ad808a48f28678e --- /dev/null +++ b/model/model/layers/26/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:b5af25a54cda0629c0c92d7138432a6ca570856923d8cea6a845ff9ee972c400 +size 1234748 diff --git a/model/model/layers/26/self_attn/k_proj/kernel/2.0 b/model/model/layers/26/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..09beeae6dc3ba23964fecd7cdac75114caab1d95 --- /dev/null +++ b/model/model/layers/26/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed87bdaf1c516ab7c355a52eff45971050c5b259743f08b283f565776e62dd69 +size 1234881 diff --git a/model/model/layers/26/self_attn/k_proj/kernel/3.0 b/model/model/layers/26/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..522726260b755c9fd06e0577d1247d4f0062e19c --- /dev/null +++ b/model/model/layers/26/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af2d3ec8aeba4f1409bd9a8edb2ac81578063253e9513c927a35f3bcef76e1e0 +size 1234300 diff --git a/model/model/layers/26/self_attn/o_proj/kernel/.zarray b/model/model/layers/26/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/26/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/26/self_attn/o_proj/kernel/0.0 b/model/model/layers/26/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..fcaf8d41fcd186220027ec970ff07c4e57e76e7e --- /dev/null +++ b/model/model/layers/26/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23524238f7350f9dbc8feda0f9e7f0b68f266e7c2d1829ee8621637f752724d3 +size 3678677 diff --git 
a/model/model/layers/26/self_attn/o_proj/kernel/0.1 b/model/model/layers/26/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..397a8fd7041e1c14e1a289020a842dc0b0460373 --- /dev/null +++ b/model/model/layers/26/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d695d5d83a55ca3964fb08da83678c1e407a00bf1d3ca35c9ad77be743b01c58 +size 3678321 diff --git a/model/model/layers/26/self_attn/o_proj/kernel/0.2 b/model/model/layers/26/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..eade8ea63db5e203d90966fd84bc76a789fb1a97 --- /dev/null +++ b/model/model/layers/26/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cbf4aec14bd0785004bdcc5692890c0dae862a3b5a9634aec1b0a630c5b6616 +size 3679669 diff --git a/model/model/layers/26/self_attn/o_proj/kernel/0.3 b/model/model/layers/26/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..aacfc5c9f735936bda97d0a54576538790bb32ca --- /dev/null +++ b/model/model/layers/26/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:860cf7a1d5d4628d188ddf93e3943f7f1574b736d98887229b3aa7735902b64d +size 3677628 diff --git a/model/model/layers/26/self_attn/q_proj/kernel/.zarray b/model/model/layers/26/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/26/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/26/self_attn/q_proj/kernel/0.0 b/model/model/layers/26/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..3f11f1ab6a15ac0ee9d60d2432654dbd2379a46d --- /dev/null +++ b/model/model/layers/26/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:723f07ca81bdc0aa23d5ed89fe6de22cf5b03143543376df93ec93c34c6e8cb6 +size 3706317 diff --git a/model/model/layers/26/self_attn/q_proj/kernel/1.0 b/model/model/layers/26/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..b7cb990bff8ebbffb5828818cd221decf5c711ee --- /dev/null +++ b/model/model/layers/26/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:688a9ab92311b9ce7fbef235b50c766a412510ba36969ba1c6a7f51f0bde5f9e +size 3706080 diff --git a/model/model/layers/26/self_attn/q_proj/kernel/2.0 b/model/model/layers/26/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..ad2bcb27224fc0879cdf276d7dc267a81f1b68cd --- /dev/null +++ b/model/model/layers/26/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85101df41c0bbabb0c0beed3a5997501f563cdb0b3b7bb5ca8eb79e0bfb2a4bc +size 3706421 diff --git a/model/model/layers/26/self_attn/q_proj/kernel/3.0 b/model/model/layers/26/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..e0360680adf623f04d5589577769531f7e1be3c4 --- /dev/null +++ b/model/model/layers/26/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad21a56369aded41bbe95f6fa8953a462a2ad123b91570450e0844d256e248cb +size 3706538 diff --git a/model/model/layers/26/self_attn/v_proj/kernel/.zarray b/model/model/layers/26/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/26/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/26/self_attn/v_proj/kernel/0.0 b/model/model/layers/26/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..6eb488ffbdf0a2f6dafb80cc9bd83c1b9bb72dae --- /dev/null +++ b/model/model/layers/26/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ed4ade6ba73e97b869acc851d31a453ae7b2481f9745ce3d9cbba71ebdc368e +size 1232322 diff --git a/model/model/layers/26/self_attn/v_proj/kernel/1.0 b/model/model/layers/26/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..d4818e4abf229e4c93b20ad446ee40c0739a8804 --- /dev/null +++ b/model/model/layers/26/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e705d41f97e758fc1a468a0b3ff2cdf09ba1ec886092618179f6e157d57a9caa +size 1232646 diff --git a/model/model/layers/26/self_attn/v_proj/kernel/2.0 b/model/model/layers/26/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..9073a895a3ee0bfb3795e052b6e977c26667a91b --- /dev/null +++ b/model/model/layers/26/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:797644a3a50623f2dc6fc877fafb92993ad2ca34bc767bd24b8db49d0a636485 +size 1232405 diff --git a/model/model/layers/26/self_attn/v_proj/kernel/3.0 b/model/model/layers/26/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..39131d026e1df2933956211173dc54ae50e23285 --- /dev/null +++ b/model/model/layers/26/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:065ff679e931f336520dc9a1e522f3634aadbe93820a8d88b3e432a8800e90b9 +size 1231855 
diff --git a/model/model/layers/27/input_layernorm/kernel/.zarray b/model/model/layers/27/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/27/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/27/input_layernorm/kernel/0 b/model/model/layers/27/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..8a3e54deb3c494116be070388b70025a6c6d79ef Binary files /dev/null and b/model/model/layers/27/input_layernorm/kernel/0 differ diff --git a/model/model/layers/27/mlp/down_proj/kernel/.zarray b/model/model/layers/27/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/27/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/27/mlp/down_proj/kernel/0.0 b/model/model/layers/27/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..d6a8ce433180a6957d2032a735e14959ec12bd44 --- /dev/null +++ b/model/model/layers/27/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:803e8bd2086d9212a3f93eac66a8b8a4e1b39b7b581a42c49f81b702be477430 +size 9815427 diff --git a/model/model/layers/27/mlp/down_proj/kernel/0.1 b/model/model/layers/27/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..828103fe17bfa88c2cce0450ccee25d329e9e5e3 --- /dev/null +++ b/model/model/layers/27/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37745b037e2ad901e45a265f5b87c4a28550ed2fa301fab4fca85f18360f676d +size 9815880 diff --git a/model/model/layers/27/mlp/down_proj/kernel/0.2 b/model/model/layers/27/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..1b17f82fa3b990692dc24c499c9ca7b33c555e52 --- /dev/null +++ b/model/model/layers/27/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15f835eb2fbdb7787b64ff139d775c537c494db0fa51323ea6d71ee7d75c686e +size 9816698 diff --git a/model/model/layers/27/mlp/down_proj/kernel/0.3 b/model/model/layers/27/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..b40029e6d8640231b8957d3fb8a05b12fac42e32 --- /dev/null +++ b/model/model/layers/27/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aca36e6f33968f1d69af777e20061c5b5a6a85405ed02cb42486e5249474d67c +size 9813186 diff --git a/model/model/layers/27/mlp/gate_proj/kernel/.zarray b/model/model/layers/27/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/27/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/27/mlp/gate_proj/kernel/0.0 b/model/model/layers/27/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..20bacf0b486331594eb3eee2b0d55087992f7148 --- /dev/null +++ b/model/model/layers/27/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bf31507e2b819c9b86f8a0ca65dcc611e8f474e8c673f1bea97a25f0e1f2910 +size 9838427 diff --git a/model/model/layers/27/mlp/gate_proj/kernel/1.0 b/model/model/layers/27/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..49810f20948ed5f1a2be987998eef4391e9f9b40 --- /dev/null +++ b/model/model/layers/27/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f77f24a707aac6a086149bc004eddf3c21625d76d7237ec66ba3a505601fafec +size 9840163 diff --git a/model/model/layers/27/mlp/gate_proj/kernel/2.0 b/model/model/layers/27/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..9e9befccd826e20da6a48da59584927477835dc6 --- /dev/null +++ b/model/model/layers/27/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:266e43de1489cbe77612b1c59bbc5c89914049101fab00c96de486ce0b023e44 +size 9839301 diff --git a/model/model/layers/27/mlp/gate_proj/kernel/3.0 b/model/model/layers/27/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..0a45e02a1094ee1949ffabde401cabc604128875 --- /dev/null +++ b/model/model/layers/27/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd6f99d6fee3c3fb1f98ce7dd85edd328653a3356cdd770d503e7211cb1f65c2 +size 9838837 diff --git a/model/model/layers/27/mlp/up_proj/kernel/.zarray b/model/model/layers/27/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/27/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/27/mlp/up_proj/kernel/0.0 b/model/model/layers/27/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c85ef40534aad7d74eab5f886fe85afa18c82fca --- /dev/null +++ b/model/model/layers/27/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2c6323a982cb4fc39c284930c27d66b86f3b7c5cb5d2a7af37621333c29b2e3 +size 9808272 diff --git a/model/model/layers/27/mlp/up_proj/kernel/1.0 b/model/model/layers/27/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..6dca0f799d4dae2e5c2c023af542281317019a09 --- /dev/null +++ b/model/model/layers/27/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31c8649917f30187cb07a1cf08d849e659120f35291063cd7977d5db311d416d +size 9808572 diff --git a/model/model/layers/27/mlp/up_proj/kernel/2.0 b/model/model/layers/27/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..f9efa8439c59443d7cbb5d0d63236ac9462193bf --- /dev/null +++ b/model/model/layers/27/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:599d27dfbf75b98cc6f5ba71c2145d594505937966da100f322c5ac46a102edc +size 9809406 diff --git a/model/model/layers/27/mlp/up_proj/kernel/3.0 b/model/model/layers/27/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..d0e3bb1d8690484db0c279accff006920a9677dc --- /dev/null +++ b/model/model/layers/27/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c316f1808c42909684a5fa0d5a09d498599f4e2194f733dce09a1a78915b33e +size 9807088 diff --git a/model/model/layers/27/post_attention_layernorm/kernel/.zarray b/model/model/layers/27/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ 
b/model/model/layers/27/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/27/post_attention_layernorm/kernel/0 b/model/model/layers/27/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..86adabca098bee417fa9edd4af2b33d9bc8213a6 Binary files /dev/null and b/model/model/layers/27/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/27/self_attn/k_proj/kernel/.zarray b/model/model/layers/27/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/27/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/27/self_attn/k_proj/kernel/0.0 b/model/model/layers/27/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a26a6a4248e00f52fbc583a3da9e4dc4e4655c6f --- /dev/null +++ b/model/model/layers/27/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff20a43f3994b13fbe01b032e72748277dfb5ac8778d768d1b82e65d375f4fbb +size 1232807 diff --git a/model/model/layers/27/self_attn/k_proj/kernel/1.0 b/model/model/layers/27/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..4ae194d251fdd85e4c61cced5904b07f7738fea5 --- /dev/null +++ b/model/model/layers/27/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:3d6016aa59736a66eeae2b88b92917945259b4fcb630fb4f6fbc46be576edbde +size 1232996 diff --git a/model/model/layers/27/self_attn/k_proj/kernel/2.0 b/model/model/layers/27/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..faed5bb6a6034767d39f64109f342c920ca227f3 --- /dev/null +++ b/model/model/layers/27/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:704b5c772d56fc67c7122a5ef07262e2fd03591cb9982468f333d07db5b1e75c +size 1232944 diff --git a/model/model/layers/27/self_attn/k_proj/kernel/3.0 b/model/model/layers/27/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..d5ddebf8dd05ef988c11b824fd37d7d50c9a5e7d --- /dev/null +++ b/model/model/layers/27/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9d18aaa5e878ecbc38820b28f78d6bb1deb9026f4c2fc4135b63a1616bae3c1 +size 1232751 diff --git a/model/model/layers/27/self_attn/o_proj/kernel/.zarray b/model/model/layers/27/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/27/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/27/self_attn/o_proj/kernel/0.0 b/model/model/layers/27/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..4e91ce7c76259f484c099bd4d09788fcce753e6a --- /dev/null +++ b/model/model/layers/27/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea7fa32cf98e5e2c19b0614b72bf2d4a08a095caf273d229e9662f99307e1d3a +size 3678751 diff --git 
a/model/model/layers/27/self_attn/o_proj/kernel/0.1 b/model/model/layers/27/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..7107a46935a56b6b1890e4dea78f6e3ae539e63e --- /dev/null +++ b/model/model/layers/27/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf11070380259bc5286c208dc6540943d6a7ffd5ac055b27c8236d537a0db339 +size 3678737 diff --git a/model/model/layers/27/self_attn/o_proj/kernel/0.2 b/model/model/layers/27/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..fbba0e1cc84c8a2bb91fb34f4016ec79b80cf95d --- /dev/null +++ b/model/model/layers/27/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e51172cf237336030337d5c780e1e0c4fe9961c342572abeb22101d9a39563db +size 3679875 diff --git a/model/model/layers/27/self_attn/o_proj/kernel/0.3 b/model/model/layers/27/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..aabfa596cf350ff024ce0f94bf3ba272a2fc953a --- /dev/null +++ b/model/model/layers/27/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b36d03a63d0246764870c8fa19037d3c980f7fe548d0985f94cc0054f853463 +size 3677939 diff --git a/model/model/layers/27/self_attn/q_proj/kernel/.zarray b/model/model/layers/27/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/27/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/27/self_attn/q_proj/kernel/0.0 b/model/model/layers/27/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..06f28bd5dcb4c5953c2ba084e766984bb2d802b5 --- /dev/null +++ b/model/model/layers/27/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afdf22db7789f82d8dc30d1417d5394dc706bcf77bcde93ea9fd71d275c07b5e +size 3697327 diff --git a/model/model/layers/27/self_attn/q_proj/kernel/1.0 b/model/model/layers/27/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..f98cb8ba9370b792e7a9a99f97f9f4309b468f03 --- /dev/null +++ b/model/model/layers/27/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccd77b2fbf2e2e232c4f6e60b9ce66b465245f94089c68deeee7e4ae4a42b1b4 +size 3697275 diff --git a/model/model/layers/27/self_attn/q_proj/kernel/2.0 b/model/model/layers/27/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..01b3ab7c4de016089c4ed936c35396d15e57dd59 --- /dev/null +++ b/model/model/layers/27/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeee05181475cb3c25cad3843e64a7959a80ee93b27f6f2ab5d1c07f63b8aa85 +size 3697064 diff --git a/model/model/layers/27/self_attn/q_proj/kernel/3.0 b/model/model/layers/27/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..9a5686a2f235081f01df0c42a83cd029671dad99 --- /dev/null +++ b/model/model/layers/27/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd58ed9330b52f501fd19541c8c7f7671ca10097cd47c3dffd832c48284491e8 +size 3696536 diff --git a/model/model/layers/27/self_attn/v_proj/kernel/.zarray b/model/model/layers/27/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/27/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/27/self_attn/v_proj/kernel/0.0 b/model/model/layers/27/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f11bf6b1c82c713d6002826d0cc78033835263a6 --- /dev/null +++ b/model/model/layers/27/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce2998925c8e6b0520e58fd617dd0d28937b157aa1aeab8172d6cbc6029445db +size 1228472 diff --git a/model/model/layers/27/self_attn/v_proj/kernel/1.0 b/model/model/layers/27/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..1fbb3acc9b817a2f24e4abc5cae37b462667fea6 --- /dev/null +++ b/model/model/layers/27/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c34f767946af08a0c14cd02f18e647fb956fb2e894dba794c821830a345368c8 +size 1228963 diff --git a/model/model/layers/27/self_attn/v_proj/kernel/2.0 b/model/model/layers/27/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..f42cec825d87d41f554da73549f4f50db6983a61 --- /dev/null +++ b/model/model/layers/27/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8b3e13a5871cb5a2703201728c4d97ffaf96326de602316e8a9a0232c58ffe1 +size 1228631 diff --git a/model/model/layers/27/self_attn/v_proj/kernel/3.0 b/model/model/layers/27/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..2e9fe1cc93ff472ffaec5f103ce6c065f94b79ed --- /dev/null +++ b/model/model/layers/27/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e9b4844edb6921759d03a093704e934a493001161c5888a15e19563ab12659d +size 1228080 
diff --git a/model/model/layers/3/input_layernorm/kernel/.zarray b/model/model/layers/3/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/3/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/input_layernorm/kernel/0 b/model/model/layers/3/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..87d683874a6f421c5be79f546e737cefc605897e Binary files /dev/null and b/model/model/layers/3/input_layernorm/kernel/0 differ diff --git a/model/model/layers/3/mlp/down_proj/kernel/.zarray b/model/model/layers/3/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/3/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/mlp/down_proj/kernel/0.0 b/model/model/layers/3/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..42b7a584f48d6e4efdbe28464e94aeb7128b27f7 --- /dev/null +++ b/model/model/layers/3/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ca784c7798cc9bbdf2c18233b013049ea1af1b09f72dcd3c6d0b8462749e03f +size 9791659 diff --git a/model/model/layers/3/mlp/down_proj/kernel/0.1 b/model/model/layers/3/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..4769034f30f9906c12550c07659b2b9c1d266d25 --- 
/dev/null +++ b/model/model/layers/3/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8d1d0c231b7265ab06425b4a6e101d7ae5fd2d7a6f694489dd09df7f9660ab1 +size 9793644 diff --git a/model/model/layers/3/mlp/down_proj/kernel/0.2 b/model/model/layers/3/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..344433478eaabb2475adb924dd6cc7ccd867f4c5 --- /dev/null +++ b/model/model/layers/3/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da5b4b29e88d0a1ba3d21cc33e78eccccc2ce60ac72084f364fb141e122a3fcb +size 9790977 diff --git a/model/model/layers/3/mlp/down_proj/kernel/0.3 b/model/model/layers/3/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..3b4a418216c7a9851f9f80378b443a22bd4c9b90 --- /dev/null +++ b/model/model/layers/3/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbd2e92c5e3cc04c4711b624447e241a2c1e58b565b37585c5055d54fcca280e +size 9793296 diff --git a/model/model/layers/3/mlp/gate_proj/kernel/.zarray b/model/model/layers/3/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/3/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/mlp/gate_proj/kernel/0.0 b/model/model/layers/3/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..30da07196b7f651fd108a4a2cc21a6a9056d4059 --- /dev/null +++ b/model/model/layers/3/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:6cabbb1464da5a787ddc70c76725b5cb8e3ecf7ba4e623e9c416033ce7c14a36 +size 9808509 diff --git a/model/model/layers/3/mlp/gate_proj/kernel/1.0 b/model/model/layers/3/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..878ade16fe5a53d03febd0c0a18622751a76ec64 --- /dev/null +++ b/model/model/layers/3/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62844249d89b4fee9903dcaae4dd2d1b451ebb6cded259d9f21f03ec83ac3da4 +size 9806669 diff --git a/model/model/layers/3/mlp/gate_proj/kernel/2.0 b/model/model/layers/3/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..250936566ae2d92e91e356b4c394e4c48def43ef --- /dev/null +++ b/model/model/layers/3/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:224115d132405ebe85859a44e37e7fdfabd37838ad3570e48e405c1e3bf67a57 +size 9807260 diff --git a/model/model/layers/3/mlp/gate_proj/kernel/3.0 b/model/model/layers/3/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..19ebd3610ad738f2110e4f7710be96891414f2e9 --- /dev/null +++ b/model/model/layers/3/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8159137a155f0820eb700facba683d645b6247996f19f58baeeeca10b96f16f +size 9807132 diff --git a/model/model/layers/3/mlp/up_proj/kernel/.zarray b/model/model/layers/3/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/3/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/mlp/up_proj/kernel/0.0 
b/model/model/layers/3/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a73b34134c626570b9b76cad54098c2a26e90532 --- /dev/null +++ b/model/model/layers/3/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b16a19967615a708093eb687568c8d9ab06b50ca165b45ecf03d32eb6351122a +size 9790159 diff --git a/model/model/layers/3/mlp/up_proj/kernel/1.0 b/model/model/layers/3/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..2694e3195a4af4106fda1b404583e323193bdad1 --- /dev/null +++ b/model/model/layers/3/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42ef8e136507df9830cc1fff0dcea6a96eb5f94e7195a2ddb4647e88e7257206 +size 9789162 diff --git a/model/model/layers/3/mlp/up_proj/kernel/2.0 b/model/model/layers/3/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..fb99d79095f06bc870be8a839f059dddbaf15c35 --- /dev/null +++ b/model/model/layers/3/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5c2eeca363f3d227edc23ca18e99a0023d24e9b881348365f4ffec9a8f703c3 +size 9790544 diff --git a/model/model/layers/3/mlp/up_proj/kernel/3.0 b/model/model/layers/3/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6ad1e1129730e39c3c44e4d538f70215a6d18f6b --- /dev/null +++ b/model/model/layers/3/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f600427f93dc076e5501c55956f59b12306c400621017bd79bef5163a9343c5d +size 9789453 diff --git a/model/model/layers/3/post_attention_layernorm/kernel/.zarray b/model/model/layers/3/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/3/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/post_attention_layernorm/kernel/0 b/model/model/layers/3/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..0e7a673003ee40f027fa97ec05631f2d7019e811 Binary files /dev/null and b/model/model/layers/3/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/3/self_attn/k_proj/kernel/.zarray b/model/model/layers/3/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/3/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/self_attn/k_proj/kernel/0.0 b/model/model/layers/3/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..99971de7996f2e4ed590a298d3adfbe3b8e3d8e0 --- /dev/null +++ b/model/model/layers/3/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abafc658bbf82e8915045fdec49aec7f7b4c3876d4c5a021824611d6e7baf644 +size 1235532 diff --git a/model/model/layers/3/self_attn/k_proj/kernel/1.0 b/model/model/layers/3/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..c635728bc11ff795aa472ebfdfddad3234bd713e --- /dev/null +++ b/model/model/layers/3/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08e0fa7156475d808209d2a8ac68da62dcbffafa63b673b31aab5853c95fc7e1 +size 1235327 diff --git 
a/model/model/layers/3/self_attn/k_proj/kernel/2.0 b/model/model/layers/3/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..9367d81b49ece293ae7148c46501018b028cf699 --- /dev/null +++ b/model/model/layers/3/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ccce3390b82f0e350b8e9de9ea5049d3edaaa98af105d50ec15fdf91c197084 +size 1235567 diff --git a/model/model/layers/3/self_attn/k_proj/kernel/3.0 b/model/model/layers/3/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..e5b62e8ea7ca1ee81a523b51c1bedfb4c8f91e73 --- /dev/null +++ b/model/model/layers/3/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ffba97318600f74769ffb67f809ab1c60ab9c2f652960bd9da0a7cabcb7010b +size 1235727 diff --git a/model/model/layers/3/self_attn/o_proj/kernel/.zarray b/model/model/layers/3/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/3/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/self_attn/o_proj/kernel/0.0 b/model/model/layers/3/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..45777fd8941336b71c19d9ff043b2e09473586fa --- /dev/null +++ b/model/model/layers/3/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32e7add1d772c323368f5ff8aca7feeb0f7b8945995128eba152aa97a19a5a8e +size 3666449 diff --git a/model/model/layers/3/self_attn/o_proj/kernel/0.1 b/model/model/layers/3/self_attn/o_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..0d5478b49317f117ed82cf6b9b607b14b65ca497 --- /dev/null +++ b/model/model/layers/3/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ee5758efc88d74d12979026eee185518f2f3ee9f895dfea4c0720be3371b7af +size 3667274 diff --git a/model/model/layers/3/self_attn/o_proj/kernel/0.2 b/model/model/layers/3/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..aa899873fde466879191f6b1f8b2969cf02d9a63 --- /dev/null +++ b/model/model/layers/3/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b774d2ffdc0383fa21f1c7153d303461840625418df2b8836947d9c45ceced2b +size 3666168 diff --git a/model/model/layers/3/self_attn/o_proj/kernel/0.3 b/model/model/layers/3/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..f5d102a800c6528300c9bbcb61a7164e52dac896 --- /dev/null +++ b/model/model/layers/3/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bda8736bde217e6ca0dc20e8e70d00501436dcbd3d415253c0d29d8ad4fa4f3 +size 3667028 diff --git a/model/model/layers/3/self_attn/q_proj/kernel/.zarray b/model/model/layers/3/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/3/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/self_attn/q_proj/kernel/0.0 b/model/model/layers/3/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ccd23409bf52717b90759857e14dce5f98e88189 --- /dev/null +++ 
b/model/model/layers/3/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12df501cc80ec85f514f51edad2376250dbe14461f26156a97f6ce563fd0cb19 +size 3702068 diff --git a/model/model/layers/3/self_attn/q_proj/kernel/1.0 b/model/model/layers/3/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..3b3f9b3c45b31e06a0a705bdf61eb39537e6ad2b --- /dev/null +++ b/model/model/layers/3/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:350534a42782e88d3f64b235d7e6fc202ab638daec04710099fd3ad919447401 +size 3701919 diff --git a/model/model/layers/3/self_attn/q_proj/kernel/2.0 b/model/model/layers/3/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..8ff2d44ef1c6ee45e53e59e80088398c30564d16 --- /dev/null +++ b/model/model/layers/3/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd630b2c41a3924d0a0c1cda59c9921248ab19672f451e8ccd54003e837715b6 +size 3701671 diff --git a/model/model/layers/3/self_attn/q_proj/kernel/3.0 b/model/model/layers/3/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..015a633341d5484321cd9b228342c30bed6ec4d6 --- /dev/null +++ b/model/model/layers/3/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e2ca92780e54b26bc5f20c574d8f634114ea5f0bad1f45e47dc394339045a7d +size 3703199 diff --git a/model/model/layers/3/self_attn/v_proj/kernel/.zarray b/model/model/layers/3/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/3/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/self_attn/v_proj/kernel/0.0 b/model/model/layers/3/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ec4a72db2e917ff9d67a39f7982aa0df5551867b --- /dev/null +++ b/model/model/layers/3/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81f0b224056f089d32f23281c0f5c2c00a3210c80c226416cb6395d1978d3be9 +size 1224585 diff --git a/model/model/layers/3/self_attn/v_proj/kernel/1.0 b/model/model/layers/3/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..c41a77170c21f109e78851677918969534f484c5 --- /dev/null +++ b/model/model/layers/3/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc7fed9d397f454941561b4b1e69a19144354af70f7fa546f5c753f0348bcdf9 +size 1225242 diff --git a/model/model/layers/3/self_attn/v_proj/kernel/2.0 b/model/model/layers/3/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..44623d1ac3fce2dfb1135f8d52d01e2eb44af0da --- /dev/null +++ b/model/model/layers/3/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:152af568e0639fdd67254b06a094313df722a2c70bcb9e02f6c4b85d2e4a23c6 +size 1224696 diff --git a/model/model/layers/3/self_attn/v_proj/kernel/3.0 b/model/model/layers/3/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..d7cb81c7c26c54b94c9b92b13c5d885ea1830d72 --- /dev/null +++ b/model/model/layers/3/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b80c1801f8f760cfb86c1834877aba301881b095ca48387fea6387a01f0de534 +size 1224592 diff --git 
a/model/model/layers/4/input_layernorm/kernel/.zarray b/model/model/layers/4/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/4/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/input_layernorm/kernel/0 b/model/model/layers/4/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..f1d0a231163c9f76370881d547e515fb39fe2b8a Binary files /dev/null and b/model/model/layers/4/input_layernorm/kernel/0 differ diff --git a/model/model/layers/4/mlp/down_proj/kernel/.zarray b/model/model/layers/4/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/4/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/mlp/down_proj/kernel/0.0 b/model/model/layers/4/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..9b32ae51d7c6cf16ef1d68f548779094f66e9472 --- /dev/null +++ b/model/model/layers/4/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3efa9f9237b55c8148467eee92d0c97d16d2d098b001c6075cc59206f6fba4cc +size 9791375 diff --git a/model/model/layers/4/mlp/down_proj/kernel/0.1 b/model/model/layers/4/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..3d8af09910b40cbaf9dfc46486af061ad9296f04 --- /dev/null +++ 
b/model/model/layers/4/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c55b8e7f4c4d171c8bdb654200009c500bce5343794b6820ff284337fcf1403f +size 9792610 diff --git a/model/model/layers/4/mlp/down_proj/kernel/0.2 b/model/model/layers/4/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..eef4ef6095b14e47da83969320f4943dcfd36244 --- /dev/null +++ b/model/model/layers/4/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:668b6194f602a2b90b71c1af10885c62b0862a572da60a15d37f4a00f34d5a98 +size 9790228 diff --git a/model/model/layers/4/mlp/down_proj/kernel/0.3 b/model/model/layers/4/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..c2bb87adcf761e76105d844b39cb2b336103cda8 --- /dev/null +++ b/model/model/layers/4/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4dea6ad4d4a64d2a5268414915c67bc3815582aaf233f5bb1393ea5ae5b3d4b +size 9791624 diff --git a/model/model/layers/4/mlp/gate_proj/kernel/.zarray b/model/model/layers/4/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/4/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/mlp/gate_proj/kernel/0.0 b/model/model/layers/4/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e9f7fdb92825a88f2028aeb167846ee5155e13f3 --- /dev/null +++ b/model/model/layers/4/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:bf0d9c34450da970fef3ba23cdfef438327a8b022194dbe13138e76c6aa33084 +size 9823952 diff --git a/model/model/layers/4/mlp/gate_proj/kernel/1.0 b/model/model/layers/4/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..7129c3fe9f64292e0fb3fe02c4bb7a53625c4400 --- /dev/null +++ b/model/model/layers/4/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bad07328d0f5e8357c47bf8f5fe3ef61002d4238a53d4dd9e12ce78e0f226b1b +size 9821303 diff --git a/model/model/layers/4/mlp/gate_proj/kernel/2.0 b/model/model/layers/4/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..ebedc7549a0d89eca436e782765280a9f87b3f05 --- /dev/null +++ b/model/model/layers/4/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71f37101a8e63312704a9efb1d715230391cd613d262752809b5f2c891b97931 +size 9820904 diff --git a/model/model/layers/4/mlp/gate_proj/kernel/3.0 b/model/model/layers/4/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..2f6bf143793134e1b2dcf6a398cf4ecc612b3ff3 --- /dev/null +++ b/model/model/layers/4/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f4bcc5ed936e0f8c97a2bbb7fdf8807e654412a936f828b33fa012506dd8d90 +size 9821615 diff --git a/model/model/layers/4/mlp/up_proj/kernel/.zarray b/model/model/layers/4/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/4/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/mlp/up_proj/kernel/0.0 
b/model/model/layers/4/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..5d8e71add71b5861faa2aee774080ba9a6edf237 --- /dev/null +++ b/model/model/layers/4/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7e38396a959061bdb558d2273159ec5aedc380a6ea6807e2824cb45061cfa29 +size 9788326 diff --git a/model/model/layers/4/mlp/up_proj/kernel/1.0 b/model/model/layers/4/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..9c0a00fd5551622907946b498a028e4531a99b9b --- /dev/null +++ b/model/model/layers/4/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83e134da6b33c35829c9a4d94c4044c266b8a01c9df5a579c586c41e3ec98787 +size 9787041 diff --git a/model/model/layers/4/mlp/up_proj/kernel/2.0 b/model/model/layers/4/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..9a653a1476e89be03c036bca88005f4d4d17560c --- /dev/null +++ b/model/model/layers/4/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54bfe95db028aec213d42015ed9fffbc3ea1f4872d56dfd70c7ff93d7e686786 +size 9787103 diff --git a/model/model/layers/4/mlp/up_proj/kernel/3.0 b/model/model/layers/4/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..38c15c045c04362335cb6c59184c690213a88324 --- /dev/null +++ b/model/model/layers/4/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4ec8f656b2ad356f9c2a75e83ef64a6d609d9e0bd2da116a06ebde95b295c55 +size 9786848 diff --git a/model/model/layers/4/post_attention_layernorm/kernel/.zarray b/model/model/layers/4/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/4/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/post_attention_layernorm/kernel/0 b/model/model/layers/4/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..7dcc50e5d605be416604e085ff3733cb2ed2f844 Binary files /dev/null and b/model/model/layers/4/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/4/self_attn/k_proj/kernel/.zarray b/model/model/layers/4/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/4/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/self_attn/k_proj/kernel/0.0 b/model/model/layers/4/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c54ec50710b63614cadb5227abdb5e312f731fe6 --- /dev/null +++ b/model/model/layers/4/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27b51293c1219b6dfa8e8696dd490062e8bb97d9d070c96935ed70cdc84b4925 +size 1234176 diff --git a/model/model/layers/4/self_attn/k_proj/kernel/1.0 b/model/model/layers/4/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..74a4e47e0396ce289ec266b666a98742df7616d9 --- /dev/null +++ b/model/model/layers/4/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba90057012275209b7957aa8a6736319390070998100b380bad3311f8d3298b5 +size 1234066 diff --git 
a/model/model/layers/4/self_attn/k_proj/kernel/2.0 b/model/model/layers/4/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..b0a9d57ede99f1bd9eb24f7817a73eca97317731 --- /dev/null +++ b/model/model/layers/4/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aee81d8116019ff055c976b6b6e002d59396e67b8c105bfcbba54fe03bd3394e +size 1234044 diff --git a/model/model/layers/4/self_attn/k_proj/kernel/3.0 b/model/model/layers/4/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..a990d08dbc72a0069d68665f447510f486d8d80e --- /dev/null +++ b/model/model/layers/4/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a11e14ced996e63ff9fc0a6767f381dd88240fdcc57bd3a2b595a0cff4638f49 +size 1234418 diff --git a/model/model/layers/4/self_attn/o_proj/kernel/.zarray b/model/model/layers/4/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/4/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/self_attn/o_proj/kernel/0.0 b/model/model/layers/4/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ac085864947a8f085d76e81be05ab8d590c7ca74 --- /dev/null +++ b/model/model/layers/4/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4f93a00081cb34f4056e4e3ca371a907484d4c0cde4f2dd4871518981e5f0eb +size 3672297 diff --git a/model/model/layers/4/self_attn/o_proj/kernel/0.1 b/model/model/layers/4/self_attn/o_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..3a79e2107dc080b24f8f1d7d15b49bbe74e25347 --- /dev/null +++ b/model/model/layers/4/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc959cc3cb8724356c9b9a5f51746e58e4337f13052627795b6c4907b68a97aa +size 3672974 diff --git a/model/model/layers/4/self_attn/o_proj/kernel/0.2 b/model/model/layers/4/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..1974f3d5adc352f6af73e74c7bd465e63544046b --- /dev/null +++ b/model/model/layers/4/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad2399fc7f18e34131230a7df9283769711f4cad2cbf43d4b6c59b4e28147f5f +size 3672098 diff --git a/model/model/layers/4/self_attn/o_proj/kernel/0.3 b/model/model/layers/4/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..34dbd03121f27646fc270f13f67ba28b117e196b --- /dev/null +++ b/model/model/layers/4/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c458c744ed546ab782e6b4803a5a94f3585bd05864cffb5dac58f314143b7b9 +size 3672977 diff --git a/model/model/layers/4/self_attn/q_proj/kernel/.zarray b/model/model/layers/4/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/4/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/self_attn/q_proj/kernel/0.0 b/model/model/layers/4/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..80164b98bb2c802b894f4df277c7ecfbbc3cecb9 --- /dev/null +++ 
b/model/model/layers/4/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36103bca774548162bd32f3b9e6c004d70491a41e3bbea2550be358b5379f57b +size 3703397 diff --git a/model/model/layers/4/self_attn/q_proj/kernel/1.0 b/model/model/layers/4/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..7fecb9b0ebfe726dae15d5e5b96ba7995707c2dc --- /dev/null +++ b/model/model/layers/4/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b3cdb904892f28a2e5d30449bc0e91fabd1adf62de3badac320e559ee15238b +size 3703797 diff --git a/model/model/layers/4/self_attn/q_proj/kernel/2.0 b/model/model/layers/4/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..77878a739d7216f110b2973ca9543acc3422578a --- /dev/null +++ b/model/model/layers/4/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b89938e3665fe2f13546ad00c39c2d64cf00ebc76b4aee047f0e8d70bbf695c4 +size 3703242 diff --git a/model/model/layers/4/self_attn/q_proj/kernel/3.0 b/model/model/layers/4/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..bfbb9dba655f8f68304f19739cd74dff461b8475 --- /dev/null +++ b/model/model/layers/4/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3128d2a1b4f5439816a6e35aba9dc1f33fed814a0bce66e7ee2e2143844f7e33 +size 3705052 diff --git a/model/model/layers/4/self_attn/v_proj/kernel/.zarray b/model/model/layers/4/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/4/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/self_attn/v_proj/kernel/0.0 b/model/model/layers/4/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..15a2427de671238a4b5660a1e8bb78efc76487e0 --- /dev/null +++ b/model/model/layers/4/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e683e529b488a02218cae16a9153f06fc7a9ad3f63cfa374dcd276e76b8782c7 +size 1227609 diff --git a/model/model/layers/4/self_attn/v_proj/kernel/1.0 b/model/model/layers/4/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..3023316846349a050ecac050e40326d0e3825828 --- /dev/null +++ b/model/model/layers/4/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90b6c973587be9a0841f45d6126190da775a9ddfc09d8a9288b9dc510f2f06e0 +size 1227266 diff --git a/model/model/layers/4/self_attn/v_proj/kernel/2.0 b/model/model/layers/4/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..ee5fb9bd0e8980ae8deb933bccc2fc599c6676ad --- /dev/null +++ b/model/model/layers/4/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6343ed4db21799bf574b920acb525f99f88a696ed232978a1dc5cf4c1e4a39b +size 1227281 diff --git a/model/model/layers/4/self_attn/v_proj/kernel/3.0 b/model/model/layers/4/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..a7f19f79af84015ceecf447d98744810769550ef --- /dev/null +++ b/model/model/layers/4/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb22423c9b4f6bfd0ce7c7a1db7e54ad46e0364270851a30cd3e8ab79ccbada8 +size 1227235 diff --git 
a/model/model/layers/5/input_layernorm/kernel/.zarray b/model/model/layers/5/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/5/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/input_layernorm/kernel/0 b/model/model/layers/5/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..fb8081db7728df0824c3416075ddc2e22aaa92f2 Binary files /dev/null and b/model/model/layers/5/input_layernorm/kernel/0 differ diff --git a/model/model/layers/5/mlp/down_proj/kernel/.zarray b/model/model/layers/5/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/5/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/mlp/down_proj/kernel/0.0 b/model/model/layers/5/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..023ec75fa3c34ca8af8207991bc5c91ed5ef7acf --- /dev/null +++ b/model/model/layers/5/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c83c86bf322a1497b9eaa784ed549abbcc7b78566299a892908a93e8534ebfd6 +size 9792797 diff --git a/model/model/layers/5/mlp/down_proj/kernel/0.1 b/model/model/layers/5/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..be966535323304d13a076774c2bab7c2b7e3326c --- /dev/null +++ 
b/model/model/layers/5/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d717fe830c970b4037221a712006e1b9f7b6ac0018810da81ef7366aebb21e2 +size 9795157 diff --git a/model/model/layers/5/mlp/down_proj/kernel/0.2 b/model/model/layers/5/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..89b397d6bd6ed8f6b2497901f4d8b7ab00ade104 --- /dev/null +++ b/model/model/layers/5/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e75ca63d1a8231bbca2d548bbdc7c95f7d65f6060e48127b64e1df55d26c2c2b +size 9792198 diff --git a/model/model/layers/5/mlp/down_proj/kernel/0.3 b/model/model/layers/5/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..64df958a3d6807c453fb1b7d9f7826679ef2f69d --- /dev/null +++ b/model/model/layers/5/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40badaed9b8aa8e34a8dbd94aaf79c9d5dda1fada56f5e1b9936f2c01fb43fc0 +size 9795193 diff --git a/model/model/layers/5/mlp/gate_proj/kernel/.zarray b/model/model/layers/5/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/5/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/mlp/gate_proj/kernel/0.0 b/model/model/layers/5/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..7f5eed82bb50dbadb574e846f46d92eebc0afe11 --- /dev/null +++ b/model/model/layers/5/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:a0b714ee4aecae14ac63d09aac5269da1f1e5e006ff50f0bc0fd3b7f8a6a3b9e +size 9815111 diff --git a/model/model/layers/5/mlp/gate_proj/kernel/1.0 b/model/model/layers/5/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..b7a5adea433779aa011119f7847454eab5efa6f9 --- /dev/null +++ b/model/model/layers/5/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a183bb7e2bbec75330e68c9d99252308157ed2c494f8c912a714ccad8ea71886 +size 9813412 diff --git a/model/model/layers/5/mlp/gate_proj/kernel/2.0 b/model/model/layers/5/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..039094032da797678a30451c4b4c294987fed5f6 --- /dev/null +++ b/model/model/layers/5/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a02e9063285aa944fe15a50684ab108408a1d60e96d661bd4bb1bf296455d1a +size 9814457 diff --git a/model/model/layers/5/mlp/gate_proj/kernel/3.0 b/model/model/layers/5/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..63bdd2602bfd525386ffbeeb84d55a2504e33c2e --- /dev/null +++ b/model/model/layers/5/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:783e355b2974882de8234e570e5dd6a0017a23ade6f9cbee4dc89d711411a683 +size 9813956 diff --git a/model/model/layers/5/mlp/up_proj/kernel/.zarray b/model/model/layers/5/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/5/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/mlp/up_proj/kernel/0.0 
b/model/model/layers/5/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..470b47c2f23d475a8d2bb2faf50d2dfa4110e1d5 --- /dev/null +++ b/model/model/layers/5/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a87ffe3f69b8b9de924bf3ae14775466b984de43e6cb612d4649e39662987a90 +size 9789114 diff --git a/model/model/layers/5/mlp/up_proj/kernel/1.0 b/model/model/layers/5/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..f8201dc40f23ca234214bfc0f5a2ab7d2a861e8f --- /dev/null +++ b/model/model/layers/5/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a66a444d4a46fffc7312dd86091a2e0bad4cc08fa6c1f83eae16833af820917a +size 9788832 diff --git a/model/model/layers/5/mlp/up_proj/kernel/2.0 b/model/model/layers/5/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..38d46a34a20384d4d76fec9a7984b500c279270d --- /dev/null +++ b/model/model/layers/5/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5886f6b334ae8f3e5f5ff32b9c8be571e59e26c93d215953b1885d5b522add3 +size 9789425 diff --git a/model/model/layers/5/mlp/up_proj/kernel/3.0 b/model/model/layers/5/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..436b83a19df221868ad1443c5394a3fe4f686076 --- /dev/null +++ b/model/model/layers/5/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a058d1e27a8c4c11e9e2717eb80d2c2e1563eed23f2bd39b821c871b982a473a +size 9789040 diff --git a/model/model/layers/5/post_attention_layernorm/kernel/.zarray b/model/model/layers/5/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/5/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/post_attention_layernorm/kernel/0 b/model/model/layers/5/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..d29e4a13c6c94e59fbde4668206e65bc19f72b11 Binary files /dev/null and b/model/model/layers/5/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/5/self_attn/k_proj/kernel/.zarray b/model/model/layers/5/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/5/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/self_attn/k_proj/kernel/0.0 b/model/model/layers/5/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ffe90b486faa978657617dce51dcc7063600c222 --- /dev/null +++ b/model/model/layers/5/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76f4b5141339916a3dff2c87f28440ac61b07d98053f55abf94a05b8275df256 +size 1235371 diff --git a/model/model/layers/5/self_attn/k_proj/kernel/1.0 b/model/model/layers/5/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..5bc1df504e4469c9acfe55a5828f5dd300bee0aa --- /dev/null +++ b/model/model/layers/5/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d208c385d9af1f039678d254cd6b2dc51c83893cff61dca11ed255441c85073f +size 1235334 diff --git 
a/model/model/layers/5/self_attn/k_proj/kernel/2.0 b/model/model/layers/5/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..6e244a1b7f88b17f75537b877bceb963acf5244c --- /dev/null +++ b/model/model/layers/5/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f19cd2cca22ac904c32877b640ca81fd48bad8a0a0c58a788fba546c49b1fce8 +size 1235662 diff --git a/model/model/layers/5/self_attn/k_proj/kernel/3.0 b/model/model/layers/5/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..a0cc8fd85f567ac87def166d4e257b6240ee4bce --- /dev/null +++ b/model/model/layers/5/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f72cff9f7e760e34c3400b746ed76fe7e1a4e8ff25f5761562a73303e55fc1f6 +size 1235525 diff --git a/model/model/layers/5/self_attn/o_proj/kernel/.zarray b/model/model/layers/5/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/5/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/self_attn/o_proj/kernel/0.0 b/model/model/layers/5/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..12efd0bfc05e38d8a1f9108c98e0f0d68a539fb2 --- /dev/null +++ b/model/model/layers/5/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f9d2c881a842d642bbd766a26c201dcc21eaf2ec1da0b0eeccc4a7be2779743 +size 3670630 diff --git a/model/model/layers/5/self_attn/o_proj/kernel/0.1 b/model/model/layers/5/self_attn/o_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..6f318eb33dd88f0cc146d95264beae5a38bef6f8 --- /dev/null +++ b/model/model/layers/5/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5c99fdb28c8f6f8ff021c754a2a048148cd2dc6e883296746f7a31909f37d38 +size 3671059 diff --git a/model/model/layers/5/self_attn/o_proj/kernel/0.2 b/model/model/layers/5/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..bec236519091824bed21dd4ae4fa8efebabb8120 --- /dev/null +++ b/model/model/layers/5/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7075523015e5b45c75e9e9afa35cd61f1d72439f516d49767963637b5fc0f329 +size 3669558 diff --git a/model/model/layers/5/self_attn/o_proj/kernel/0.3 b/model/model/layers/5/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..fef589b9390e4d08d919a7f2359b69f612a77ca2 --- /dev/null +++ b/model/model/layers/5/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db3c05a0bb2b6af1349d4bebb16e54de0747c4560044321f3224860b34ca3c71 +size 3670763 diff --git a/model/model/layers/5/self_attn/q_proj/kernel/.zarray b/model/model/layers/5/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/5/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/self_attn/q_proj/kernel/0.0 b/model/model/layers/5/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..9b03ecfe84b7f48aac733749c244ebb333a3fcd2 --- /dev/null +++ 
b/model/model/layers/5/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25f38d0ba0d0d471a39e1f6c3fdcaafd04f8670ddf0ed7f91ccf49079a57502f +size 3702467 diff --git a/model/model/layers/5/self_attn/q_proj/kernel/1.0 b/model/model/layers/5/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..2e86ed15639c3a962693a82a01a3fe7cd12523c1 --- /dev/null +++ b/model/model/layers/5/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a100ecc773c9efa03a294ab5e0c219128a38de8c24b083acca5664154e0e4c94 +size 3702397 diff --git a/model/model/layers/5/self_attn/q_proj/kernel/2.0 b/model/model/layers/5/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..4c5a9575e450c774659ba5116f09d729100e5029 --- /dev/null +++ b/model/model/layers/5/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82e3bc4db428594f2f8b000fc307050b0d55a43070d1188d1329c3aff1df9219 +size 3702128 diff --git a/model/model/layers/5/self_attn/q_proj/kernel/3.0 b/model/model/layers/5/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..66969b4aeae0f1605af26c06b202d0d5a9ca7389 --- /dev/null +++ b/model/model/layers/5/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c7e29b2545c9670f4b938195c9d4eaf769e8d1020d686600d8b57367cb4027 +size 3702400 diff --git a/model/model/layers/5/self_attn/v_proj/kernel/.zarray b/model/model/layers/5/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/5/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/self_attn/v_proj/kernel/0.0 b/model/model/layers/5/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..926d61fb9dfad80a2b85f8f360d2344fe08d496b --- /dev/null +++ b/model/model/layers/5/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad546cac4dcda5f150697bf57d1335298f5cfc50070f0c3ea82cba3e35f62c0f +size 1227219 diff --git a/model/model/layers/5/self_attn/v_proj/kernel/1.0 b/model/model/layers/5/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..94e65390c2bd5c9ee0a7ae96a3bb14713d93a768 --- /dev/null +++ b/model/model/layers/5/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ed70b8236644cbb9f29c6376276bc9ecc2ccc823fe3ddbb6ff371f1464d52d9 +size 1227218 diff --git a/model/model/layers/5/self_attn/v_proj/kernel/2.0 b/model/model/layers/5/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..a756cc25c8db900ac08c16233f9f640f9f5dcc5d --- /dev/null +++ b/model/model/layers/5/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72ed7dfb0bc98c3c37f6343d83247b06d18c06a7a256fddf8ed3ed827d9e3dab +size 1227091 diff --git a/model/model/layers/5/self_attn/v_proj/kernel/3.0 b/model/model/layers/5/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..b8533b98bd27ec044589468ca4237715847e2d3c --- /dev/null +++ b/model/model/layers/5/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a8e5bbab7de1ab367bd839e2feba9f591fcd2a93db6811ee00f92c6a04f0a8d +size 1227235 diff --git 
a/model/model/layers/6/input_layernorm/kernel/.zarray b/model/model/layers/6/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/6/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/input_layernorm/kernel/0 b/model/model/layers/6/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..1594f90011497fade59fbed8351926df27edf053 Binary files /dev/null and b/model/model/layers/6/input_layernorm/kernel/0 differ diff --git a/model/model/layers/6/mlp/down_proj/kernel/.zarray b/model/model/layers/6/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/6/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/mlp/down_proj/kernel/0.0 b/model/model/layers/6/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..baefde413df643e58c5089ba98cfe0bc607c06f7 --- /dev/null +++ b/model/model/layers/6/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a1af625c2d86aed22de9f17a543c105455fca79e134ab09979e447b462046c6 +size 9796347 diff --git a/model/model/layers/6/mlp/down_proj/kernel/0.1 b/model/model/layers/6/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..461dc874aa0ea2ef0e7bcf439765b0e237547821 --- /dev/null +++ 
b/model/model/layers/6/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeeb17b3af7ea814101fac45a4e0f3361689838136ab0d6afeedd811ff38ae33 +size 9798960 diff --git a/model/model/layers/6/mlp/down_proj/kernel/0.2 b/model/model/layers/6/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..753e1e7b8701b4c6196dde5abaf6a68394670736 --- /dev/null +++ b/model/model/layers/6/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1076cfcde135762139ff3487cd1b6d41c9539a6c2aa35566fd451c13ed458c4 +size 9795049 diff --git a/model/model/layers/6/mlp/down_proj/kernel/0.3 b/model/model/layers/6/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..c1b5a48fd8aa715aca6b4a953eb41bc28826dbd7 --- /dev/null +++ b/model/model/layers/6/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a01e3ab9a46fa3acc8155caa6c4fe9907fdd053cc369cdf896c41ae3403923f +size 9797526 diff --git a/model/model/layers/6/mlp/gate_proj/kernel/.zarray b/model/model/layers/6/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/6/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/mlp/gate_proj/kernel/0.0 b/model/model/layers/6/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..61160d40691acc7bba6de675d6a8d5ceb53da430 --- /dev/null +++ b/model/model/layers/6/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:343024d5849a76b5b09fcc9ecae43f40611b4a258dcba8350a5212565093f15f +size 9815208 diff --git a/model/model/layers/6/mlp/gate_proj/kernel/1.0 b/model/model/layers/6/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..8d358004cb31d493df5ab716cdac3893459746f8 --- /dev/null +++ b/model/model/layers/6/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:057fc4ae335e40826882408874c6c5077f3c77b977ee1d24a04899f90a26e54e +size 9813786 diff --git a/model/model/layers/6/mlp/gate_proj/kernel/2.0 b/model/model/layers/6/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..554dfa7fa66e529ff84221d1b52c3dca0deebac7 --- /dev/null +++ b/model/model/layers/6/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b8af11d79fdc566b95825c0e257c0c5c7916cdd2640700405232e36c1e46a5d +size 9813442 diff --git a/model/model/layers/6/mlp/gate_proj/kernel/3.0 b/model/model/layers/6/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..4572ffedb79bbf5a623ee0f4e12aff2923978ec5 --- /dev/null +++ b/model/model/layers/6/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:600761dc1459e3641e516521812122de585fbfa1560018e96e6ed9270977d87f +size 9813889 diff --git a/model/model/layers/6/mlp/up_proj/kernel/.zarray b/model/model/layers/6/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/6/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/mlp/up_proj/kernel/0.0 
b/model/model/layers/6/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..64a90d31f7fd55d3cef21cbb9ecb23e6b848f193 --- /dev/null +++ b/model/model/layers/6/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4a1699f64deba3b661501c17360e5d8f3a7feee5f3e03d1a1afbbab8198ad2f +size 9791407 diff --git a/model/model/layers/6/mlp/up_proj/kernel/1.0 b/model/model/layers/6/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..994ba884779589eaa85a54056ac5b3b327b8faa6 --- /dev/null +++ b/model/model/layers/6/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c694bcd4204a63acc88797d8367380b364061705959505e33f8490984aeeb61 +size 9791623 diff --git a/model/model/layers/6/mlp/up_proj/kernel/2.0 b/model/model/layers/6/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..a9ace3f04be78b95d0ef50cacb9a5adef3ad3c45 --- /dev/null +++ b/model/model/layers/6/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdbd5afca0f1c773189748a03a7631a0ae50609b12b1d617cfb9893d87d7467c +size 9791587 diff --git a/model/model/layers/6/mlp/up_proj/kernel/3.0 b/model/model/layers/6/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..77dfd286b4901bba135b1859fcc2f1bacc6d94d9 --- /dev/null +++ b/model/model/layers/6/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d3c09607be17c678608289111d3b24c10edcc7524703efeb975521fe1fd130 +size 9789226 diff --git a/model/model/layers/6/post_attention_layernorm/kernel/.zarray b/model/model/layers/6/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/6/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/post_attention_layernorm/kernel/0 b/model/model/layers/6/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..ee87ed6498f137739a6fd8ff7dc75d8d5edd43fa Binary files /dev/null and b/model/model/layers/6/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/6/self_attn/k_proj/kernel/.zarray b/model/model/layers/6/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/6/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/self_attn/k_proj/kernel/0.0 b/model/model/layers/6/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..2d1663ece6428ff15044611aefc8dd270d46a4b3 --- /dev/null +++ b/model/model/layers/6/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21206690e2d3f89633dd0c71dc0caa6a12eb67246455a40ce7d1272caaf0ccc0 +size 1233114 diff --git a/model/model/layers/6/self_attn/k_proj/kernel/1.0 b/model/model/layers/6/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..2deb0f34840068aed13245deab0fa07db08ea116 --- /dev/null +++ b/model/model/layers/6/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:916b0e01ece02f12b4a33e87de003376e695a777ce21fccd815b3de87e2d793d +size 1232446 diff --git 
a/model/model/layers/6/self_attn/k_proj/kernel/2.0 b/model/model/layers/6/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..16f2a7839521371224f5925d1dbaa33afd056b02 --- /dev/null +++ b/model/model/layers/6/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddb4250d49aa1a9e721222a931bd770e7447d40ce6ccf585982459dc4f729249 +size 1232631 diff --git a/model/model/layers/6/self_attn/k_proj/kernel/3.0 b/model/model/layers/6/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..06ff1dc4722fcbc7160865eea4350288dd5d9949 --- /dev/null +++ b/model/model/layers/6/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92e71b9f63e606682de53ff73106a6f67bde672c59026e4f4ade27b24fbfff94 +size 1232520 diff --git a/model/model/layers/6/self_attn/o_proj/kernel/.zarray b/model/model/layers/6/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/6/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/self_attn/o_proj/kernel/0.0 b/model/model/layers/6/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8e7c5c810a73325a8462c67d57b2505704c8034b --- /dev/null +++ b/model/model/layers/6/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91b0506d92f6e48c31ce1ba9dc00a834df4d7d1f44086ca0c411f24e351e56b1 +size 3667503 diff --git a/model/model/layers/6/self_attn/o_proj/kernel/0.1 b/model/model/layers/6/self_attn/o_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..e2dd8e07d60069c45686e840cb6f85209f8525f6 --- /dev/null +++ b/model/model/layers/6/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4504423b73637d9a44b36c22389331e8d4386f53c7630042cda6b6e303b333ac +size 3667876 diff --git a/model/model/layers/6/self_attn/o_proj/kernel/0.2 b/model/model/layers/6/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..ef70f94bf35234aaec680500e1ac0a29ebe27a85 --- /dev/null +++ b/model/model/layers/6/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9d5248ca549b352b7136a7deabae29eaf64fdc6a7c8bc6dc4366e5e5e145e4c +size 3666862 diff --git a/model/model/layers/6/self_attn/o_proj/kernel/0.3 b/model/model/layers/6/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..0472674221c6c56233402271d66d3eb65db60ca2 --- /dev/null +++ b/model/model/layers/6/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0180d7324efffdb2ab24ec5614a689888a5728eb6fc36be753a2726bc9cd5617 +size 3667775 diff --git a/model/model/layers/6/self_attn/q_proj/kernel/.zarray b/model/model/layers/6/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/6/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/self_attn/q_proj/kernel/0.0 b/model/model/layers/6/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..0fa0c2fd93a71532d28b5688515e1db04d72875d --- /dev/null +++ 
b/model/model/layers/6/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cf5514f9c898cf742e0418c8cfb4e66d79ffcfe19aa4eab33b19a6352d7618e +size 3701043 diff --git a/model/model/layers/6/self_attn/q_proj/kernel/1.0 b/model/model/layers/6/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..138b0f2ae81c4d4436a0e14f29a9f04fdb993559 --- /dev/null +++ b/model/model/layers/6/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b00ecb5b0ef575732a33cee29a19d95ba4aec8409f937b76549a86e5b4d72930 +size 3701207 diff --git a/model/model/layers/6/self_attn/q_proj/kernel/2.0 b/model/model/layers/6/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..fa04f8a48edc20a3847418ba53ec0fb7f4d82918 --- /dev/null +++ b/model/model/layers/6/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3987380ecc290ebf94363e9a1398b0e1959a8e80653f12ca5aa15b9024f75e0 +size 3701171 diff --git a/model/model/layers/6/self_attn/q_proj/kernel/3.0 b/model/model/layers/6/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..291655bea0a662f688a081364d637d26aaa190aa --- /dev/null +++ b/model/model/layers/6/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dd5278a53115923a2694177cfb628097060ac1c2da86c43f63e6ba073a0643c +size 3701192 diff --git a/model/model/layers/6/self_attn/v_proj/kernel/.zarray b/model/model/layers/6/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/6/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/self_attn/v_proj/kernel/0.0 b/model/model/layers/6/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..23f4a4ea2adcb7ab62cf487390e2c1ecbbd43275 --- /dev/null +++ b/model/model/layers/6/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d35592fdd56dba761a97016b27a714a7819db6f69e0374c0d7a2e6ddbf1b633 +size 1225514 diff --git a/model/model/layers/6/self_attn/v_proj/kernel/1.0 b/model/model/layers/6/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..cefaaaf776fdfc534e92f3b32ffb8b5c7d50578a --- /dev/null +++ b/model/model/layers/6/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fc84b9cb7f375ecc6f6ee8f9752dd06871196a78a54b584834fcde1b9243f3e +size 1225517 diff --git a/model/model/layers/6/self_attn/v_proj/kernel/2.0 b/model/model/layers/6/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..d433daff0b67366a855ef2e6f78312ebabd03c3f --- /dev/null +++ b/model/model/layers/6/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b55d7b9bba76a998e7d6b53af7d69d34242549156f3e5135204122e536c9b9c6 +size 1226111 diff --git a/model/model/layers/6/self_attn/v_proj/kernel/3.0 b/model/model/layers/6/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..1a7ea6267dd27f65fad59614ebeb114813b42c30 --- /dev/null +++ b/model/model/layers/6/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f35673ad4c45bbb19d386995e29f2ca24313b16f1d8ff774292a0dc9dc445271 +size 1225253 diff --git 
a/model/model/layers/7/input_layernorm/kernel/.zarray b/model/model/layers/7/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/7/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/input_layernorm/kernel/0 b/model/model/layers/7/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..9d61fd19fdef4aa644ec8227d512a439f9fe1b44 Binary files /dev/null and b/model/model/layers/7/input_layernorm/kernel/0 differ diff --git a/model/model/layers/7/mlp/down_proj/kernel/.zarray b/model/model/layers/7/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/7/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/mlp/down_proj/kernel/0.0 b/model/model/layers/7/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..6137ef4d103266dc42f83bd8cdfb5d3b8e28525f --- /dev/null +++ b/model/model/layers/7/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:540c3d5fddc3247e68b5cb441719d04385b55875086d188fcc470c163a54d613 +size 9804658 diff --git a/model/model/layers/7/mlp/down_proj/kernel/0.1 b/model/model/layers/7/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..ea67735a9623a97bd3ada3abb63593f378639dca --- /dev/null +++ 
b/model/model/layers/7/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28f4210b85d196414b2155026d3ff3b0844eb09f637b9b6f22dd7f7d29cf4c82 +size 9807613 diff --git a/model/model/layers/7/mlp/down_proj/kernel/0.2 b/model/model/layers/7/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..3c51750038110e0d7eba2ff51cd6499143c57e7f --- /dev/null +++ b/model/model/layers/7/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5eb7e7a5c186e9db3b135370d1a81ba8a7764e68ef25b2f0ec62258b3490b91 +size 9803273 diff --git a/model/model/layers/7/mlp/down_proj/kernel/0.3 b/model/model/layers/7/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..d2988bdc552190b3474af63b57008b43b776229a --- /dev/null +++ b/model/model/layers/7/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3ddde94eebcfd2c4be6af0e651c7f1e084167333f0c97fcdf1568b13db4083a +size 9805472 diff --git a/model/model/layers/7/mlp/gate_proj/kernel/.zarray b/model/model/layers/7/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/7/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/mlp/gate_proj/kernel/0.0 b/model/model/layers/7/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..1fb8cdb72786cf2835e1366c93b38502dd0e9a81 --- /dev/null +++ b/model/model/layers/7/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:31512154f8bc8d2b4f9ba62a2d6a86ed3b0b5a886f876193c40796caa16c47ad +size 9813736 diff --git a/model/model/layers/7/mlp/gate_proj/kernel/1.0 b/model/model/layers/7/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..cd36c8c45d12febdfabd2335e8aa0abc06d9187f --- /dev/null +++ b/model/model/layers/7/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d09cc4de88138299800fbed44e5ee07bc537287d8082fe26ec581ef184b62ed8 +size 9813633 diff --git a/model/model/layers/7/mlp/gate_proj/kernel/2.0 b/model/model/layers/7/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..f29b4f8b90082103c4e422b571292b834db1947b --- /dev/null +++ b/model/model/layers/7/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbe400f1cf8197eda22615ee555e5825b6db834d6743cf33ee3be57310f23b1b +size 9814270 diff --git a/model/model/layers/7/mlp/gate_proj/kernel/3.0 b/model/model/layers/7/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..5fabb427614535d132c4a7553f1b85759f66da48 --- /dev/null +++ b/model/model/layers/7/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:457be7bba99eb27a69d1e75456f984ebaf5c5d8d2665261feedbb0104cff098e +size 9812569 diff --git a/model/model/layers/7/mlp/up_proj/kernel/.zarray b/model/model/layers/7/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/7/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/mlp/up_proj/kernel/0.0 
b/model/model/layers/7/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..573ac84371782dde81f44511d0abff7ecb38000d --- /dev/null +++ b/model/model/layers/7/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3d4082dc7541ebcc317c3994eac655dfedca3c2b7072ec7ca5853345063c3cc +size 9793707 diff --git a/model/model/layers/7/mlp/up_proj/kernel/1.0 b/model/model/layers/7/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..578ca4a1ed694c43de513cca19f487decbbd4927 --- /dev/null +++ b/model/model/layers/7/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:298ceaea8fa8856378e1ddcb9b41efda316e572973da4110d46ec4830a3947bb +size 9795567 diff --git a/model/model/layers/7/mlp/up_proj/kernel/2.0 b/model/model/layers/7/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..9956e51b18648831e4aa536684dd8860875e46cf --- /dev/null +++ b/model/model/layers/7/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed7e8c14ec9cada2f90370776b8081f2eaab7aec0065e1e5d7e2208007e52d78 +size 9795592 diff --git a/model/model/layers/7/mlp/up_proj/kernel/3.0 b/model/model/layers/7/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..f66ad317128d60f7be891eb51278b397a7add652 --- /dev/null +++ b/model/model/layers/7/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a2f78712928e3631474657d4972a5b5636d64cafa1dd9f30c34231c1f35c309 +size 9793195 diff --git a/model/model/layers/7/post_attention_layernorm/kernel/.zarray b/model/model/layers/7/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/7/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/post_attention_layernorm/kernel/0 b/model/model/layers/7/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..3a3559547a2358cc4f2b927970598d5c6e1312d0 Binary files /dev/null and b/model/model/layers/7/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/7/self_attn/k_proj/kernel/.zarray b/model/model/layers/7/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/7/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/self_attn/k_proj/kernel/0.0 b/model/model/layers/7/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..4567307975159b84fa098ed7f5d69ba0fdc699d9 --- /dev/null +++ b/model/model/layers/7/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b36c13844719c1e5185280d56d3cf45ad72131a8efcd3b573f347465b7607594 +size 1233345 diff --git a/model/model/layers/7/self_attn/k_proj/kernel/1.0 b/model/model/layers/7/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..25cd7d271fa9e3663ce9942421b3e4276d680586 --- /dev/null +++ b/model/model/layers/7/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:054961c929c3c5b23f664123c6d12b8debe0929fa0200aa96067bf25f4cce356 +size 1233141 diff --git 
a/model/model/layers/7/self_attn/k_proj/kernel/2.0 b/model/model/layers/7/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..145c6110477c839cb19374b61d6ec80c5eb7a5c0 --- /dev/null +++ b/model/model/layers/7/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86cf98be1dca1b1e42a2eb114e3d8056735901e7a70179ead95d256cfa81c79b +size 1233282 diff --git a/model/model/layers/7/self_attn/k_proj/kernel/3.0 b/model/model/layers/7/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..c83675ddf651279fd4209672aae5d674985d1c4e --- /dev/null +++ b/model/model/layers/7/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:083891ef042008949b484daa546534ef3f26be010eae29611521f1d964da9f28 +size 1233354 diff --git a/model/model/layers/7/self_attn/o_proj/kernel/.zarray b/model/model/layers/7/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/7/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/self_attn/o_proj/kernel/0.0 b/model/model/layers/7/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f0040504cb18284da5c76e275dd9b8909214c344 --- /dev/null +++ b/model/model/layers/7/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fea5bf645799505578df320883eb1a28cf8f457d6677cfc1faf26f4470d0c3c4 +size 3672840 diff --git a/model/model/layers/7/self_attn/o_proj/kernel/0.1 b/model/model/layers/7/self_attn/o_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..1e5f8fe825b66e62371eb65e667a0665493f249f --- /dev/null +++ b/model/model/layers/7/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:170d57eccc733ad93b3ff1146d16fe4bdfb8c0b5dd6e73c86b9193d4574216c3 +size 3673344 diff --git a/model/model/layers/7/self_attn/o_proj/kernel/0.2 b/model/model/layers/7/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..ecd3679b0f14e7288eb56b6c2066d28cb5ba684e --- /dev/null +++ b/model/model/layers/7/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30b6b0e5cc6ca9b3ce04b9f23065182f95b8350bef2ac385506b571f4655d8b1 +size 3672139 diff --git a/model/model/layers/7/self_attn/o_proj/kernel/0.3 b/model/model/layers/7/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..6e4ab38782c6cca5a80e8d1349ab8632ddb19207 --- /dev/null +++ b/model/model/layers/7/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9031ae63d5b7d7881ffa899fa01b7113fbb8c6957c8f772e5d1c494074879e0 +size 3672518 diff --git a/model/model/layers/7/self_attn/q_proj/kernel/.zarray b/model/model/layers/7/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/7/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/self_attn/q_proj/kernel/0.0 b/model/model/layers/7/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..d14e0416d5e8cc7ca28ff228c8371d98335356a8 --- /dev/null +++ 
b/model/model/layers/7/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc7e4e97b8330ff997af280593028418d8f6be164906e3f6b7c5c6a828af5190 +size 3703347 diff --git a/model/model/layers/7/self_attn/q_proj/kernel/1.0 b/model/model/layers/7/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..4a4c481ebc837f341c4e918b5f1cf0364129d16d --- /dev/null +++ b/model/model/layers/7/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d1c7b497f0eae7a6199d72536e10ff726ac7832ad8075a874a48a24b5ae86a1 +size 3703415 diff --git a/model/model/layers/7/self_attn/q_proj/kernel/2.0 b/model/model/layers/7/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..3bc655b0211abed0b79168fbc2ac911d62474330 --- /dev/null +++ b/model/model/layers/7/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01668a97fb086c900eb4e1024ca88863e20fbb53be2c531ac78bc005b1eb74ec +size 3703107 diff --git a/model/model/layers/7/self_attn/q_proj/kernel/3.0 b/model/model/layers/7/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6767704b67cea0e350a8f69cd0f7e2429e475358 --- /dev/null +++ b/model/model/layers/7/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bba9d1549775685ad825d5c493afce5e13dade3df650353d134d445d59119595 +size 3703603 diff --git a/model/model/layers/7/self_attn/v_proj/kernel/.zarray b/model/model/layers/7/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/7/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/self_attn/v_proj/kernel/0.0 b/model/model/layers/7/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..3f4a757b7b0b3340f3ba2fc679c754cc24796f20 --- /dev/null +++ b/model/model/layers/7/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c49d798d1e5abe332f5e507946e2ec14fbb9f9986610af03c68053adcb327a92 +size 1226469 diff --git a/model/model/layers/7/self_attn/v_proj/kernel/1.0 b/model/model/layers/7/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..73533e1771fb81205959d48328bb101d43da17d1 --- /dev/null +++ b/model/model/layers/7/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8304b413040f339d5e6ca7c998a61b63f89b083a0a5b86e6b4eb5df35cf2839 +size 1226347 diff --git a/model/model/layers/7/self_attn/v_proj/kernel/2.0 b/model/model/layers/7/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..bd3a8d8d2111c1c1d7adf72939a3c0a893dc0b68 --- /dev/null +++ b/model/model/layers/7/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3eefce90559205ed0437899e2f32206bc23780fde7b8e5cd884d4382bc04e57 +size 1226299 diff --git a/model/model/layers/7/self_attn/v_proj/kernel/3.0 b/model/model/layers/7/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..0f1c9bda8e046c5ddc35189479454f371aeab1b4 --- /dev/null +++ b/model/model/layers/7/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18289b0ef804c0dfe29449c443d957f47a3f7ee5f4ca2f75e96333c2f414ff3c +size 1226004 diff --git 
a/model/model/layers/8/input_layernorm/kernel/.zarray b/model/model/layers/8/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/8/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/input_layernorm/kernel/0 b/model/model/layers/8/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..d3d205a3fae32330f226966542e69a384c8c0328 Binary files /dev/null and b/model/model/layers/8/input_layernorm/kernel/0 differ diff --git a/model/model/layers/8/mlp/down_proj/kernel/.zarray b/model/model/layers/8/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/8/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/mlp/down_proj/kernel/0.0 b/model/model/layers/8/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..4c3b817d4dd6d0c36e4ed03da3b8071c54026ce5 --- /dev/null +++ b/model/model/layers/8/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0577d08e7dd948801528e69dc2aeb365994d7a5388eede8299c661acc0474b0 +size 9806623 diff --git a/model/model/layers/8/mlp/down_proj/kernel/0.1 b/model/model/layers/8/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..a58f96d5ab0dc97bd77178b1f79efd25583dde9a --- /dev/null +++ 
b/model/model/layers/8/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4fd5616a423375efe4d18022e6f97dd31eca0a1090538c02b93851a130410b4 +size 9807823 diff --git a/model/model/layers/8/mlp/down_proj/kernel/0.2 b/model/model/layers/8/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..b1ebc2132de5f5fc35bc057087f58804293c010d --- /dev/null +++ b/model/model/layers/8/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e32d5c6203c630fe77fed035a1bef108da2f226445b881f4768a63a9bf6055a +size 9804061 diff --git a/model/model/layers/8/mlp/down_proj/kernel/0.3 b/model/model/layers/8/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..63ac4afab0df81d9d347b9b84bf99cbf9509c8be --- /dev/null +++ b/model/model/layers/8/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d72c6cc4ce58fcb855d3b72da5d99e077832201d67a71e5c3d72839eb26ef82 +size 9806945 diff --git a/model/model/layers/8/mlp/gate_proj/kernel/.zarray b/model/model/layers/8/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/8/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/mlp/gate_proj/kernel/0.0 b/model/model/layers/8/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..1c84d8f903a8b0f2212a86403c75191d8b2727c4 --- /dev/null +++ b/model/model/layers/8/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:bfa716757d932ccd2bcb56beff8ee51f07eb9508e52c35eee638601aaaa271ec +size 9814822 diff --git a/model/model/layers/8/mlp/gate_proj/kernel/1.0 b/model/model/layers/8/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..7b07a4b25e616bd0386da27b6d4c867470b26f6a --- /dev/null +++ b/model/model/layers/8/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:392b3024df2dc1a72614f7cb0dd9a36de4208c00d0ba71d5eed591cd6e74b915 +size 9815013 diff --git a/model/model/layers/8/mlp/gate_proj/kernel/2.0 b/model/model/layers/8/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..a0210614126c8a60d60b20010f6e5ec37cd93452 --- /dev/null +++ b/model/model/layers/8/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b3f0ac072f0bc1c1eb4634184aec9ca56ae35ec05d66c84cf1515fb0bfd77af +size 9815537 diff --git a/model/model/layers/8/mlp/gate_proj/kernel/3.0 b/model/model/layers/8/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..d009eb5ce6015c3f952368bb766b9c3e5f4b0fc2 --- /dev/null +++ b/model/model/layers/8/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d910b12a9bff2b1cfd625622634c8306b0392ea9a091eb45064620f7d3b1533b +size 9814912 diff --git a/model/model/layers/8/mlp/up_proj/kernel/.zarray b/model/model/layers/8/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/8/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/mlp/up_proj/kernel/0.0 
b/model/model/layers/8/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..6fbef5e1e9332dd3b2f3420cc081008e7e67fa23 --- /dev/null +++ b/model/model/layers/8/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68bb143d249ded5106f679c9a81df6c7f4076eeada98d28a6b5a2ab890172d70 +size 9793969 diff --git a/model/model/layers/8/mlp/up_proj/kernel/1.0 b/model/model/layers/8/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..72bb63073e061595871c6456c4471d0b839a8be6 --- /dev/null +++ b/model/model/layers/8/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5958b1d0d589b73d8715f0da81a405a3ef7524bd83cd1a43733aad1d42aa2aa +size 9794986 diff --git a/model/model/layers/8/mlp/up_proj/kernel/2.0 b/model/model/layers/8/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..d6f184d1e8fa7afa292ecf47de80fb23460df638 --- /dev/null +++ b/model/model/layers/8/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47c1ca5261dfaaa68f62e94cd4c67bf8636ddc3e15c2f3794c4cef5df4419205 +size 9796501 diff --git a/model/model/layers/8/mlp/up_proj/kernel/3.0 b/model/model/layers/8/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..44f212217d59b118e591df3bfc9d5ef9fb944f02 --- /dev/null +++ b/model/model/layers/8/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65cd7c4f809d2012db9f4188e086aee1b1f1a92c8d908d17ba619e77797308ec +size 9793300 diff --git a/model/model/layers/8/post_attention_layernorm/kernel/.zarray b/model/model/layers/8/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/8/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/post_attention_layernorm/kernel/0 b/model/model/layers/8/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..b53ee2deb64d14a974b1baeb8fa0c98d71efd231 Binary files /dev/null and b/model/model/layers/8/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/8/self_attn/k_proj/kernel/.zarray b/model/model/layers/8/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/8/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/self_attn/k_proj/kernel/0.0 b/model/model/layers/8/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..04c39e58a832265317238ffed9fd4e90352b2afe --- /dev/null +++ b/model/model/layers/8/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b852ab1483d61a921e824b6a4a009943bf9023dbd26ac7a232a5138309b3fcb +size 1235232 diff --git a/model/model/layers/8/self_attn/k_proj/kernel/1.0 b/model/model/layers/8/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..413f3f2be271f280afbcf1455aaa86f0d0305912 --- /dev/null +++ b/model/model/layers/8/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6796876633cb4b5d3cbc3ccbb21946dfd8bab542148a5d6aca3f03b067706c28 +size 1234939 diff --git 
a/model/model/layers/8/self_attn/k_proj/kernel/2.0 b/model/model/layers/8/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..95e466301742a34f6dc2a8b34400e830bef9ec1e --- /dev/null +++ b/model/model/layers/8/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:653d668f0c3121163d409f7a0028cb69e86185c7063b2a75374bec2d911cbf20 +size 1234722 diff --git a/model/model/layers/8/self_attn/k_proj/kernel/3.0 b/model/model/layers/8/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..fcad16af9a020e1d3ae4f586127285a30ac7381b --- /dev/null +++ b/model/model/layers/8/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e65164f8281d6cf734cd1d57c1aff5648fde59574e02d07333a1177f34e91e96 +size 1234927 diff --git a/model/model/layers/8/self_attn/o_proj/kernel/.zarray b/model/model/layers/8/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/8/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/self_attn/o_proj/kernel/0.0 b/model/model/layers/8/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e64cb7e644b053ee7fe9e1a4cb24ff0cfbd50bcb --- /dev/null +++ b/model/model/layers/8/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be7213e704dee70cfcaf3abafe2cd28dbc6063fb318128a06c3853bbac2a8304 +size 3673732 diff --git a/model/model/layers/8/self_attn/o_proj/kernel/0.1 b/model/model/layers/8/self_attn/o_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..46b6f1d9dca949eb201478b18740a273d5b8440e --- /dev/null +++ b/model/model/layers/8/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c98486d9ab6bd0c1619aaeb99460ff2f110cd12e661882479522c5882aafd658 +size 3674815 diff --git a/model/model/layers/8/self_attn/o_proj/kernel/0.2 b/model/model/layers/8/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..4002967e23db0178fb76e65daf8b7d066dc4fb52 --- /dev/null +++ b/model/model/layers/8/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eec849886893d8ffd5e6afb6f1eb63dacfba2a765514cce282a0cb02e9eb6a87 +size 3672621 diff --git a/model/model/layers/8/self_attn/o_proj/kernel/0.3 b/model/model/layers/8/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..b081be4c1bf85276df0f9f60bf22bf1196048df9 --- /dev/null +++ b/model/model/layers/8/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cab384d5d398447827722576ddd6afe2ac7d91afb78649dfdd49664ba50cce3e +size 3673138 diff --git a/model/model/layers/8/self_attn/q_proj/kernel/.zarray b/model/model/layers/8/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/8/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/self_attn/q_proj/kernel/0.0 b/model/model/layers/8/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..fdec78ea7d903ff87884bac289ee49ecbba5a3c7 --- /dev/null +++ 
b/model/model/layers/8/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2706088277b64a8a4560c974e297e7ff75019fb5b1ff72f5c80338ac41f8c3d2 +size 3702351 diff --git a/model/model/layers/8/self_attn/q_proj/kernel/1.0 b/model/model/layers/8/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..c502801d950dce3fa559d47759ef5f4b430b20f1 --- /dev/null +++ b/model/model/layers/8/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfab1700c008ce7ec1a3993303390a8050574371032fb8877d62c8ad1bcbfe2a +size 3701811 diff --git a/model/model/layers/8/self_attn/q_proj/kernel/2.0 b/model/model/layers/8/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..2fa027b362b9560c64a40e9a1bb75caa47d8070f --- /dev/null +++ b/model/model/layers/8/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79cd8a3e47bb93298407dc13169dc639627f5989173f26250a13337167851490 +size 3701936 diff --git a/model/model/layers/8/self_attn/q_proj/kernel/3.0 b/model/model/layers/8/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..bacc3c8c7f72ae276af318e8eb26dccfc70d3541 --- /dev/null +++ b/model/model/layers/8/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:338c6c3c1efacac4cec65d9058ddd1739c1e97b34ed66b0b72805ab77be8b92b +size 3702100 diff --git a/model/model/layers/8/self_attn/v_proj/kernel/.zarray b/model/model/layers/8/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/8/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/self_attn/v_proj/kernel/0.0 b/model/model/layers/8/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..24f8cace08d7abe4d43526a4b347055eaf7a8116 --- /dev/null +++ b/model/model/layers/8/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83cadec00cf9dc5b43709fb69cdba333e22344ee6ed7fce9908b3510e641a3ae +size 1227484 diff --git a/model/model/layers/8/self_attn/v_proj/kernel/1.0 b/model/model/layers/8/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..1a116bf5a356c1ba2f7f9777cec7c8163593269f --- /dev/null +++ b/model/model/layers/8/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5001f43662a4f4c21520b5fd8c770516ea9d41a04ad2301994f6d99d9d7c5f6 +size 1227487 diff --git a/model/model/layers/8/self_attn/v_proj/kernel/2.0 b/model/model/layers/8/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..33a9170a24506918cb2baff4f3c4ecdaad6aaf59 --- /dev/null +++ b/model/model/layers/8/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0b0689ac8162d629cfdbc76811aa31494f84819a647c552ed426c07daec418f +size 1227244 diff --git a/model/model/layers/8/self_attn/v_proj/kernel/3.0 b/model/model/layers/8/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..cbf89e3b30deac43b9548e7e8d3e51681f6e6507 --- /dev/null +++ b/model/model/layers/8/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e75ee6fae5e5cd28df3b73429c18a38073bc6fafe712d54978c14262b107bf0 +size 1226489 diff --git 
a/model/model/layers/9/input_layernorm/kernel/.zarray b/model/model/layers/9/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/9/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/input_layernorm/kernel/0 b/model/model/layers/9/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..3869db9df8ca75955a4e139be028630329b7a7d0 Binary files /dev/null and b/model/model/layers/9/input_layernorm/kernel/0 differ diff --git a/model/model/layers/9/mlp/down_proj/kernel/.zarray b/model/model/layers/9/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..aa9dd4be5a58fccc89de5e44e588dbcdd72cdacd --- /dev/null +++ b/model/model/layers/9/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/mlp/down_proj/kernel/0.0 b/model/model/layers/9/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..244c6d485b2b71d15a1338ff6ba806adabfb57bb --- /dev/null +++ b/model/model/layers/9/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:256e9e8c57316ad428d45d7e4bc9d4ccb174977507c0256e17db52b82ae8bcb0 +size 9808332 diff --git a/model/model/layers/9/mlp/down_proj/kernel/0.1 b/model/model/layers/9/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..3396f658da7522845ccbdf110718a798ca3e1fe0 --- /dev/null +++ 
b/model/model/layers/9/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20bec1b4daaf994f8d9d52f95be88e96680fa99e94df8ce5c5e484473c9563eb +size 9811738 diff --git a/model/model/layers/9/mlp/down_proj/kernel/0.2 b/model/model/layers/9/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..c7d23204a877fbb50eab9bfb896a83866abbde99 --- /dev/null +++ b/model/model/layers/9/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a10e2f8ae279d8cfe4b0d2b42314eb9a2fad3cf9758ad6986f3b4cb37c9057a1 +size 9807336 diff --git a/model/model/layers/9/mlp/down_proj/kernel/0.3 b/model/model/layers/9/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..990b1ace9f1c99ad14e09d8c1c000b3db6845e49 --- /dev/null +++ b/model/model/layers/9/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c32536f251555a3ab910bd9e54f523043110a8a21e0d3e253c7a5c33a6bdcf9 +size 9810130 diff --git a/model/model/layers/9/mlp/gate_proj/kernel/.zarray b/model/model/layers/9/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/9/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/mlp/gate_proj/kernel/0.0 b/model/model/layers/9/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..197faf95154c2b070ed443bf10facc72ab164974 --- /dev/null +++ b/model/model/layers/9/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:e659894423361b688d1e7736adaa8d9b25de88c5c07bff04d6d6cfde268b538c +size 9813502 diff --git a/model/model/layers/9/mlp/gate_proj/kernel/1.0 b/model/model/layers/9/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..1daa72b28b448fece3c814e6cc6d63861eed19e9 --- /dev/null +++ b/model/model/layers/9/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8cd582a69fd3b0b4b359e0dad0d496a4d45e7412db5aa8a2d457d8894ee64ea +size 9815481 diff --git a/model/model/layers/9/mlp/gate_proj/kernel/2.0 b/model/model/layers/9/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..67440bd4c5153dd81db1b1ff82332406f3135092 --- /dev/null +++ b/model/model/layers/9/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0ccaf6a61ab5d4a7fc06c676e7583e043467e8bbe97f334e7fb332db4111913 +size 9815080 diff --git a/model/model/layers/9/mlp/gate_proj/kernel/3.0 b/model/model/layers/9/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..dbd35c7c8547121eccea621baedb4852aa3b5d38 --- /dev/null +++ b/model/model/layers/9/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:211acf407a3044291f00b044eb3ef927198f1fea821622996a7202aed851593b +size 9812799 diff --git a/model/model/layers/9/mlp/up_proj/kernel/.zarray b/model/model/layers/9/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..ae4d767e73f006afc7c6ba7399677250bb7f364c --- /dev/null +++ b/model/model/layers/9/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/mlp/up_proj/kernel/0.0 
b/model/model/layers/9/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f1507aa59d8f7c711bc317feb2c72e57840d2f81 --- /dev/null +++ b/model/model/layers/9/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a581271312e03b65f453f3760ad4831c2409fc6ed4773e56ef8c9c335d0c5152 +size 9797037 diff --git a/model/model/layers/9/mlp/up_proj/kernel/1.0 b/model/model/layers/9/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..b3c9f200477c2c830cc8af5e2f7b6236caa81f86 --- /dev/null +++ b/model/model/layers/9/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b06bfd0a8bac910c47ec63dfa1d3b768eee9845b474feaf833639ab520f71339 +size 9797544 diff --git a/model/model/layers/9/mlp/up_proj/kernel/2.0 b/model/model/layers/9/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..be39c60681810d2fb51d1570aae15687560cb8c1 --- /dev/null +++ b/model/model/layers/9/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a92807d784ac5d538c447ac69c0153615a94fec6c6a9e5f487a84be826a998e1 +size 9798461 diff --git a/model/model/layers/9/mlp/up_proj/kernel/3.0 b/model/model/layers/9/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6b0cdc81129543f3fdd5930c7b0141ee69598c8d --- /dev/null +++ b/model/model/layers/9/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4195c8f6a991b1a018dc92d07a2bde3a0ac0ba46813a51e1cf18a4f3d2b513a +size 9795775 diff --git a/model/model/layers/9/post_attention_layernorm/kernel/.zarray b/model/model/layers/9/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/layers/9/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/post_attention_layernorm/kernel/0 b/model/model/layers/9/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..b9eec9cd6a6f1a4f975fccc753a758db3db2b0da Binary files /dev/null and b/model/model/layers/9/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/9/self_attn/k_proj/kernel/.zarray b/model/model/layers/9/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/9/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/self_attn/k_proj/kernel/0.0 b/model/model/layers/9/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..cf1407710c5b6c304fda6607390be7329e460e36 --- /dev/null +++ b/model/model/layers/9/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a701623ed3100f94876c16047cd56a4e66b30c1a9083b5a798e39a4996826306 +size 1235327 diff --git a/model/model/layers/9/self_attn/k_proj/kernel/1.0 b/model/model/layers/9/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..921b35f16e11de6553b5888a6b662d58c66ad6e3 --- /dev/null +++ b/model/model/layers/9/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56d3c9cfe26ee7dcb35b8126e8ebb760c7d63f8f05c83f711c3edee24b29efde +size 1235069 diff --git 
a/model/model/layers/9/self_attn/k_proj/kernel/2.0 b/model/model/layers/9/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..47243a0469059b177548e4be613b0e3c10cffac8 --- /dev/null +++ b/model/model/layers/9/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56305c0df10de764b933db8ac3ce13088a45f12c9a29f3b83da93f39dbd7e2cb +size 1235370 diff --git a/model/model/layers/9/self_attn/k_proj/kernel/3.0 b/model/model/layers/9/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..261d79f3c7716abd257bcbca39a28f3956afd8e5 --- /dev/null +++ b/model/model/layers/9/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3fff59797ed261d81590cf0cdf04c7d403e8670cd8e66d719a0e2331b500c4c +size 1234857 diff --git a/model/model/layers/9/self_attn/o_proj/kernel/.zarray b/model/model/layers/9/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..c9e05e86af968d5b9e1679f6ea1190841d7e6f3d --- /dev/null +++ b/model/model/layers/9/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072,768],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/self_attn/o_proj/kernel/0.0 b/model/model/layers/9/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..5eb5067aacae3ffd80228d9889974f316f53e1bc --- /dev/null +++ b/model/model/layers/9/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fab4c40e868c7027546a37256fecb0b9fed972c6036f334551bccdd53803090 +size 3676972 diff --git a/model/model/layers/9/self_attn/o_proj/kernel/0.1 b/model/model/layers/9/self_attn/o_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..5f63274bc09a05222a09974ebe8d932e522e6e3f --- /dev/null +++ b/model/model/layers/9/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:792a40d16e9378c88e6da8eb5124585e97746063ed9c7316bd11cddb405600bf +size 3678166 diff --git a/model/model/layers/9/self_attn/o_proj/kernel/0.2 b/model/model/layers/9/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..79df51352560e8362b974d32eb8135e6692ec4dd --- /dev/null +++ b/model/model/layers/9/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2ee17e44b740a3f437369146086cce9a265d1c03662111f3ab6a8f0832b7cdd +size 3676153 diff --git a/model/model/layers/9/self_attn/o_proj/kernel/0.3 b/model/model/layers/9/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..98571763292fade6f3f2f4634e0919c5b8f3dc9f --- /dev/null +++ b/model/model/layers/9/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e2139b3972fac1e0e79e972892d308e82e76ca69a31bbeaf07aca3190cc885d +size 3676157 diff --git a/model/model/layers/9/self_attn/q_proj/kernel/.zarray b/model/model/layers/9/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bc9454a239b78c9a19643d1d121676bfa890e1ad --- /dev/null +++ b/model/model/layers/9/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[768,3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/self_attn/q_proj/kernel/0.0 b/model/model/layers/9/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f092346d92268901ea7e93f53888f66e66ed9f0b --- /dev/null +++ 
b/model/model/layers/9/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d54262f5504bcb37df5c7724cb0a826a709c062266057622c2c3749219d93b2 +size 3702445 diff --git a/model/model/layers/9/self_attn/q_proj/kernel/1.0 b/model/model/layers/9/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..0462c84c5206d0242451442e046733830da0731e --- /dev/null +++ b/model/model/layers/9/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25c1b79770890c0c58a663cfbeff5a999572c2d851cb75010f4b136225c95841 +size 3702557 diff --git a/model/model/layers/9/self_attn/q_proj/kernel/2.0 b/model/model/layers/9/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..fc96f86c2562e08ecc81c361305ac7f559c6f04b --- /dev/null +++ b/model/model/layers/9/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0001fa081a94eff2700e105b4a9c852bbba36b043bc6a9d535b018b7e928d27 +size 3702847 diff --git a/model/model/layers/9/self_attn/q_proj/kernel/3.0 b/model/model/layers/9/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..3ba3d8d81e97b644f86975dfa19270830792a862 --- /dev/null +++ b/model/model/layers/9/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cadf7be0f97e636d7ad6695bafc9c44fa7259385a4c246d160c220f281f474a6 +size 3702633 diff --git a/model/model/layers/9/self_attn/v_proj/kernel/.zarray b/model/model/layers/9/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9fb93b89ad08a24b38a706a6fd2aeeb8ec173f29 --- /dev/null +++ b/model/model/layers/9/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[768,1024],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072,1024],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/self_attn/v_proj/kernel/0.0 b/model/model/layers/9/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ab7b37a6654cabb304b9990d4f75002600f67e3c --- /dev/null +++ b/model/model/layers/9/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b53892e3fb441cad2b632521c7c58ff12c95f609ba1875d1e42ff24d00005496 +size 1229777 diff --git a/model/model/layers/9/self_attn/v_proj/kernel/1.0 b/model/model/layers/9/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..a03345b535e8dfc5f83be98dcdf8a3f123f8ab14 --- /dev/null +++ b/model/model/layers/9/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdca227d9853ac1a98c20681c920a3e3a07efff46758ee9440bd10e955d13155 +size 1229664 diff --git a/model/model/layers/9/self_attn/v_proj/kernel/2.0 b/model/model/layers/9/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..d91a209e96e4fc4b64f3515ec0ed1546093ed0ae --- /dev/null +++ b/model/model/layers/9/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64bafd6ecaf55bce8c270c719a35150a4f25e708837cc3ca7851e0034256e4b6 +size 1229783 diff --git a/model/model/layers/9/self_attn/v_proj/kernel/3.0 b/model/model/layers/9/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..66837ff4310329538f525c1c091ce5ebfc1855ef --- /dev/null +++ b/model/model/layers/9/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47ad6381285be436709bbf65af021e3caae5a7017bdd573b2c58faeb7931597b +size 1228963 diff --git 
a/model/model/norm/kernel/.zarray b/model/model/norm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..25b3cb9c6cb257594fcad7b4784332fcc38265b0 --- /dev/null +++ b/model/model/norm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[3072],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[3072],"zarr_format":2} \ No newline at end of file diff --git a/model/model/norm/kernel/0 b/model/model/norm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..3ad0c86df76144dd4baf0b0648801cb94b1985b5 Binary files /dev/null and b/model/model/norm/kernel/0 differ diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..02ee80b6196926a5ad790a004d9efd6ab1ba6542 --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,16 @@ +{ + "bos_token": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "eos_token": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/tensorstore_index.json b/tensorstore_index.json new file mode 100644 index 0000000000000000000000000000000000000000..c7506f5a3fcb1f483188832fde51691c69f1d4e9 --- /dev/null +++ b/tensorstore_index.json @@ -0,0 +1,1983 @@ +{ + "format": "tensorstore", + "version": "easydel", + "prefixes": { + "model": [ + { + "path": "model/model/embed_tokens/embedding", + "shape": [ + 128256, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/0/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/0/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/0/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": 
"model/model/layers/0/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/0/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/0/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/0/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/0/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/0/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + 
"dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": 
"model/model/layers/12/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/12/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/12/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/12/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/12/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/12/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/12/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/12/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/12/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/self_attn/q_proj/kernel", + "shape": [ + 3072, + 
3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/15/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/15/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/15/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/15/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/15/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/15/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": 
"model/model/layers/15/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/15/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/15/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/16/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/16/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/16/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/16/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/16/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/16/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/16/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/16/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/16/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/17/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/17/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/17/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/17/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/17/post_attention_layernorm/kernel", + "shape": [ + 
3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/17/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/17/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/17/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/17/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/18/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/18/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/18/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/18/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/18/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/18/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/18/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/18/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/18/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/19/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/19/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/19/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": 
"model/model/layers/19/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/19/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/19/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/19/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/19/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/19/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/20/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/20/mlp/up_proj/kernel", + "shape": [ + 3072, + 
8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/20/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/20/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/20/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/20/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/4/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/4/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/4/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": 
"model/model/layers/4/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/4/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/4/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/4/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/4/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/4/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + 
"dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/7/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/7/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/7/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/7/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/7/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/7/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/7/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/7/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/7/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": 
"model/model/layers/8/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/8/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/8/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/8/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/8/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/8/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/8/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/8/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/8/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + 
"dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/20/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/20/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/20/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/21/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/21/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/21/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/21/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/21/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/21/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/21/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/21/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/21/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/22/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/22/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/22/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": 
"model/model/layers/22/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/22/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/22/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/22/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/22/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/22/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/23/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/23/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/23/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/23/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/23/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/23/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/23/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/23/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/23/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/24/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/24/mlp/down_proj/kernel", + "shape": [ + 
8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/24/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/24/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/24/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/24/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/24/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/24/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/24/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/25/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/25/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/25/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/25/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/25/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/25/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/25/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/25/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/25/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": 
"model/model/layers/26/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/26/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/26/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/26/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/26/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/26/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/26/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/26/self_attn/q_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/26/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/27/input_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/27/mlp/down_proj/kernel", + "shape": [ + 8192, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/27/mlp/gate_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/27/mlp/up_proj/kernel", + "shape": [ + 3072, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/27/post_attention_layernorm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/27/self_attn/k_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/27/self_attn/o_proj/kernel", + "shape": [ + 3072, + 3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/27/self_attn/q_proj/kernel", + "shape": [ + 3072, + 
3072 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/27/self_attn/v_proj/kernel", + "shape": [ + 3072, + 1024 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/norm/kernel", + "shape": [ + 3072 + ], + "dtype": "bfloat16" + } + ] + } +} \ No newline at end of file diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1c1d8d5c9024994f1d3b00f9662b8dd89ca13cf2 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9e4e7fb171f92fd137b777cc2714bf87d11576700a1dcd7a399e7bbe39537b +size 17209920 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..8b0c7c141373ca36e5e819a28f60e146ccef652f --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,2062 @@ +{ + "added_tokens_decoder": { + "128000": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128001": { + "content": "<|end_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128002": { + "content": "<|reserved_special_token_0|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128003": { + "content": "<|reserved_special_token_1|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128004": { + "content": "<|finetune_right_pad_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128005": { + "content": "<|reserved_special_token_2|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128006": { + "content": "<|start_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": 
false, + "special": true + }, + "128007": { + "content": "<|end_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128008": { + "content": "<|eom_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128009": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128010": { + "content": "<|python_tag|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128011": { + "content": "<|reserved_special_token_3|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128012": { + "content": "<|reserved_special_token_4|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128013": { + "content": "<|reserved_special_token_5|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128014": { + "content": "<|reserved_special_token_6|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128015": { + "content": "<|reserved_special_token_7|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128016": { + "content": "<|reserved_special_token_8|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128017": { + "content": "<|reserved_special_token_9|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128018": { + "content": "<|reserved_special_token_10|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128019": { + 
"content": "<|reserved_special_token_11|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128020": { + "content": "<|reserved_special_token_12|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128021": { + "content": "<|reserved_special_token_13|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128022": { + "content": "<|reserved_special_token_14|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128023": { + "content": "<|reserved_special_token_15|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128024": { + "content": "<|reserved_special_token_16|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128025": { + "content": "<|reserved_special_token_17|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128026": { + "content": "<|reserved_special_token_18|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128027": { + "content": "<|reserved_special_token_19|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128028": { + "content": "<|reserved_special_token_20|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128029": { + "content": "<|reserved_special_token_21|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128030": { + "content": "<|reserved_special_token_22|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, 
+ "128031": { + "content": "<|reserved_special_token_23|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128032": { + "content": "<|reserved_special_token_24|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128033": { + "content": "<|reserved_special_token_25|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128034": { + "content": "<|reserved_special_token_26|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128035": { + "content": "<|reserved_special_token_27|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128036": { + "content": "<|reserved_special_token_28|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128037": { + "content": "<|reserved_special_token_29|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128038": { + "content": "<|reserved_special_token_30|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128039": { + "content": "<|reserved_special_token_31|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128040": { + "content": "<|reserved_special_token_32|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128041": { + "content": "<|reserved_special_token_33|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128042": { + "content": "<|reserved_special_token_34|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + 
"special": true + }, + "128043": { + "content": "<|reserved_special_token_35|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128044": { + "content": "<|reserved_special_token_36|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128045": { + "content": "<|reserved_special_token_37|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128046": { + "content": "<|reserved_special_token_38|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128047": { + "content": "<|reserved_special_token_39|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128048": { + "content": "<|reserved_special_token_40|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128049": { + "content": "<|reserved_special_token_41|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128050": { + "content": "<|reserved_special_token_42|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128051": { + "content": "<|reserved_special_token_43|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128052": { + "content": "<|reserved_special_token_44|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128053": { + "content": "<|reserved_special_token_45|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128054": { + "content": "<|reserved_special_token_46|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + 
"single_word": false, + "special": true + }, + "128055": { + "content": "<|reserved_special_token_47|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128056": { + "content": "<|reserved_special_token_48|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128057": { + "content": "<|reserved_special_token_49|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128058": { + "content": "<|reserved_special_token_50|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128059": { + "content": "<|reserved_special_token_51|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128060": { + "content": "<|reserved_special_token_52|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128061": { + "content": "<|reserved_special_token_53|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128062": { + "content": "<|reserved_special_token_54|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128063": { + "content": "<|reserved_special_token_55|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128064": { + "content": "<|reserved_special_token_56|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128065": { + "content": "<|reserved_special_token_57|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128066": { + "content": "<|reserved_special_token_58|>", + "lstrip": false, + "normalized": false, + 
"rstrip": false, + "single_word": false, + "special": true + }, + "128067": { + "content": "<|reserved_special_token_59|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128068": { + "content": "<|reserved_special_token_60|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128069": { + "content": "<|reserved_special_token_61|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128070": { + "content": "<|reserved_special_token_62|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128071": { + "content": "<|reserved_special_token_63|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128072": { + "content": "<|reserved_special_token_64|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128073": { + "content": "<|reserved_special_token_65|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128074": { + "content": "<|reserved_special_token_66|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128075": { + "content": "<|reserved_special_token_67|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128076": { + "content": "<|reserved_special_token_68|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128077": { + "content": "<|reserved_special_token_69|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128078": { + "content": "<|reserved_special_token_70|>", + "lstrip": false, + 
"normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128079": { + "content": "<|reserved_special_token_71|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128080": { + "content": "<|reserved_special_token_72|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128081": { + "content": "<|reserved_special_token_73|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128082": { + "content": "<|reserved_special_token_74|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128083": { + "content": "<|reserved_special_token_75|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128084": { + "content": "<|reserved_special_token_76|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128085": { + "content": "<|reserved_special_token_77|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128086": { + "content": "<|reserved_special_token_78|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128087": { + "content": "<|reserved_special_token_79|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128088": { + "content": "<|reserved_special_token_80|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128089": { + "content": "<|reserved_special_token_81|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128090": { + "content": "<|reserved_special_token_82|>", + 
"lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128091": { + "content": "<|reserved_special_token_83|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128092": { + "content": "<|reserved_special_token_84|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128093": { + "content": "<|reserved_special_token_85|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128094": { + "content": "<|reserved_special_token_86|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128095": { + "content": "<|reserved_special_token_87|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128096": { + "content": "<|reserved_special_token_88|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128097": { + "content": "<|reserved_special_token_89|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128098": { + "content": "<|reserved_special_token_90|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128099": { + "content": "<|reserved_special_token_91|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128100": { + "content": "<|reserved_special_token_92|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128101": { + "content": "<|reserved_special_token_93|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128102": { + "content": 
"<|reserved_special_token_94|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128103": { + "content": "<|reserved_special_token_95|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128104": { + "content": "<|reserved_special_token_96|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128105": { + "content": "<|reserved_special_token_97|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128106": { + "content": "<|reserved_special_token_98|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128107": { + "content": "<|reserved_special_token_99|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128108": { + "content": "<|reserved_special_token_100|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128109": { + "content": "<|reserved_special_token_101|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128110": { + "content": "<|reserved_special_token_102|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128111": { + "content": "<|reserved_special_token_103|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128112": { + "content": "<|reserved_special_token_104|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128113": { + "content": "<|reserved_special_token_105|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + 
"128114": { + "content": "<|reserved_special_token_106|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128115": { + "content": "<|reserved_special_token_107|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128116": { + "content": "<|reserved_special_token_108|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128117": { + "content": "<|reserved_special_token_109|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128118": { + "content": "<|reserved_special_token_110|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128119": { + "content": "<|reserved_special_token_111|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128120": { + "content": "<|reserved_special_token_112|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128121": { + "content": "<|reserved_special_token_113|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128122": { + "content": "<|reserved_special_token_114|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128123": { + "content": "<|reserved_special_token_115|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128124": { + "content": "<|reserved_special_token_116|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128125": { + "content": "<|reserved_special_token_117|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": 
false, + "special": true + }, + "128126": { + "content": "<|reserved_special_token_118|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128127": { + "content": "<|reserved_special_token_119|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128128": { + "content": "<|reserved_special_token_120|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128129": { + "content": "<|reserved_special_token_121|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128130": { + "content": "<|reserved_special_token_122|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128131": { + "content": "<|reserved_special_token_123|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128132": { + "content": "<|reserved_special_token_124|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128133": { + "content": "<|reserved_special_token_125|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128134": { + "content": "<|reserved_special_token_126|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128135": { + "content": "<|reserved_special_token_127|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128136": { + "content": "<|reserved_special_token_128|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128137": { + "content": "<|reserved_special_token_129|>", + "lstrip": false, + "normalized": false, + 
"rstrip": false, + "single_word": false, + "special": true + }, + "128138": { + "content": "<|reserved_special_token_130|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128139": { + "content": "<|reserved_special_token_131|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128140": { + "content": "<|reserved_special_token_132|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128141": { + "content": "<|reserved_special_token_133|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128142": { + "content": "<|reserved_special_token_134|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128143": { + "content": "<|reserved_special_token_135|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128144": { + "content": "<|reserved_special_token_136|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128145": { + "content": "<|reserved_special_token_137|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128146": { + "content": "<|reserved_special_token_138|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128147": { + "content": "<|reserved_special_token_139|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128148": { + "content": "<|reserved_special_token_140|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128149": { + "content": "<|reserved_special_token_141|>", + "lstrip": 
false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128150": { + "content": "<|reserved_special_token_142|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128151": { + "content": "<|reserved_special_token_143|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128152": { + "content": "<|reserved_special_token_144|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128153": { + "content": "<|reserved_special_token_145|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128154": { + "content": "<|reserved_special_token_146|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128155": { + "content": "<|reserved_special_token_147|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128156": { + "content": "<|reserved_special_token_148|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128157": { + "content": "<|reserved_special_token_149|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128158": { + "content": "<|reserved_special_token_150|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128159": { + "content": "<|reserved_special_token_151|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128160": { + "content": "<|reserved_special_token_152|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128161": { + "content": 
"<|reserved_special_token_153|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128162": { + "content": "<|reserved_special_token_154|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128163": { + "content": "<|reserved_special_token_155|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128164": { + "content": "<|reserved_special_token_156|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128165": { + "content": "<|reserved_special_token_157|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128166": { + "content": "<|reserved_special_token_158|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128167": { + "content": "<|reserved_special_token_159|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128168": { + "content": "<|reserved_special_token_160|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128169": { + "content": "<|reserved_special_token_161|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128170": { + "content": "<|reserved_special_token_162|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128171": { + "content": "<|reserved_special_token_163|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128172": { + "content": "<|reserved_special_token_164|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + 
}, + "128173": { + "content": "<|reserved_special_token_165|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128174": { + "content": "<|reserved_special_token_166|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128175": { + "content": "<|reserved_special_token_167|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128176": { + "content": "<|reserved_special_token_168|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128177": { + "content": "<|reserved_special_token_169|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128178": { + "content": "<|reserved_special_token_170|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128179": { + "content": "<|reserved_special_token_171|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128180": { + "content": "<|reserved_special_token_172|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128181": { + "content": "<|reserved_special_token_173|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128182": { + "content": "<|reserved_special_token_174|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128183": { + "content": "<|reserved_special_token_175|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128184": { + "content": "<|reserved_special_token_176|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + 
"single_word": false, + "special": true + }, + "128185": { + "content": "<|reserved_special_token_177|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128186": { + "content": "<|reserved_special_token_178|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128187": { + "content": "<|reserved_special_token_179|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128188": { + "content": "<|reserved_special_token_180|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128189": { + "content": "<|reserved_special_token_181|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128190": { + "content": "<|reserved_special_token_182|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128191": { + "content": "<|reserved_special_token_183|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128192": { + "content": "<|reserved_special_token_184|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128193": { + "content": "<|reserved_special_token_185|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128194": { + "content": "<|reserved_special_token_186|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128195": { + "content": "<|reserved_special_token_187|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128196": { + "content": "<|reserved_special_token_188|>", + "lstrip": false, + "normalized": 
false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128197": { + "content": "<|reserved_special_token_189|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128198": { + "content": "<|reserved_special_token_190|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128199": { + "content": "<|reserved_special_token_191|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128200": { + "content": "<|reserved_special_token_192|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128201": { + "content": "<|reserved_special_token_193|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128202": { + "content": "<|reserved_special_token_194|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128203": { + "content": "<|reserved_special_token_195|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128204": { + "content": "<|reserved_special_token_196|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128205": { + "content": "<|reserved_special_token_197|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128206": { + "content": "<|reserved_special_token_198|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128207": { + "content": "<|reserved_special_token_199|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128208": { + "content": "<|reserved_special_token_200|>", + 
"lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128209": { + "content": "<|reserved_special_token_201|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128210": { + "content": "<|reserved_special_token_202|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128211": { + "content": "<|reserved_special_token_203|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128212": { + "content": "<|reserved_special_token_204|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128213": { + "content": "<|reserved_special_token_205|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128214": { + "content": "<|reserved_special_token_206|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128215": { + "content": "<|reserved_special_token_207|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128216": { + "content": "<|reserved_special_token_208|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128217": { + "content": "<|reserved_special_token_209|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128218": { + "content": "<|reserved_special_token_210|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128219": { + "content": "<|reserved_special_token_211|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128220": { + "content": 
"<|reserved_special_token_212|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128221": { + "content": "<|reserved_special_token_213|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128222": { + "content": "<|reserved_special_token_214|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128223": { + "content": "<|reserved_special_token_215|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128224": { + "content": "<|reserved_special_token_216|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128225": { + "content": "<|reserved_special_token_217|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128226": { + "content": "<|reserved_special_token_218|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128227": { + "content": "<|reserved_special_token_219|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128228": { + "content": "<|reserved_special_token_220|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128229": { + "content": "<|reserved_special_token_221|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128230": { + "content": "<|reserved_special_token_222|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128231": { + "content": "<|reserved_special_token_223|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + 
}, + "128232": { + "content": "<|reserved_special_token_224|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128233": { + "content": "<|reserved_special_token_225|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128234": { + "content": "<|reserved_special_token_226|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128235": { + "content": "<|reserved_special_token_227|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128236": { + "content": "<|reserved_special_token_228|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128237": { + "content": "<|reserved_special_token_229|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128238": { + "content": "<|reserved_special_token_230|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128239": { + "content": "<|reserved_special_token_231|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128240": { + "content": "<|reserved_special_token_232|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128241": { + "content": "<|reserved_special_token_233|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128242": { + "content": "<|reserved_special_token_234|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128243": { + "content": "<|reserved_special_token_235|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + 
"single_word": false, + "special": true + }, + "128244": { + "content": "<|reserved_special_token_236|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128245": { + "content": "<|reserved_special_token_237|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128246": { + "content": "<|reserved_special_token_238|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128247": { + "content": "<|reserved_special_token_239|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128248": { + "content": "<|reserved_special_token_240|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128249": { + "content": "<|reserved_special_token_241|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128250": { + "content": "<|reserved_special_token_242|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128251": { + "content": "<|reserved_special_token_243|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128252": { + "content": "<|reserved_special_token_244|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128253": { + "content": "<|reserved_special_token_245|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128254": { + "content": "<|reserved_special_token_246|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128255": { + "content": "<|reserved_special_token_247|>", + "lstrip": false, + "normalized": 
false, + "rstrip": false, + "single_word": false, + "special": true + } + }, + "bos_token": "<|begin_of_text|>", + "clean_up_tokenization_spaces": true, + "eos_token": "<|eot_id|>", + "extra_special_tokens": {}, + "model_input_names": [ + "input_ids", + "attention_mask" + ], + "model_max_length": 131072, + "tokenizer_class": "PreTrainedTokenizerFast" +}