diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..147bf30910f5dd6d87673bc5103750ccc555c24b 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,456 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +model/model/embed_tokens/embedding/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/embed_tokens/embedding/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/embed_tokens/embedding/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/embed_tokens/embedding/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/k_proj/kernel/3.0 filter=lfs 
diff=lfs merge=lfs -text +model/model/layers/0/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/0/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/1/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/1/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/10/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/10/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/11/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/11/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/11/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/12/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/12/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/13/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/13/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/14/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/14/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/15/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/15/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/15/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/q_proj/kernel/2.0 filter=lfs 
diff=lfs merge=lfs -text +model/model/layers/2/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/2/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/3/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/3/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/k_proj/kernel/1.0 filter=lfs 
diff=lfs merge=lfs -text +model/model/layers/4/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/4/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/5/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/5/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/gate_proj/kernel/0.0 
filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/6/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/7/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/q_proj/kernel/3.0 filter=lfs 
diff=lfs merge=lfs -text +model/model/layers/7/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/7/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text 
+model/model/layers/8/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/8/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/gate_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/gate_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/gate_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/gate_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/mlp/up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/k_proj/kernel/2.0 filter=lfs 
diff=lfs merge=lfs -text +model/model/layers/9/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text +model/model/layers/9/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000000000000000000000000000000000000..b2d1ce0410c7f49533a51e7c2e681d95713e15b6 --- /dev/null +++ b/README.md @@ -0,0 +1,159 @@ +--- +library_name: easydel +pipeline_tag: text-generation +tags: + - easydel + - jax + - "llama" + - "CausalLM" + - "vanilla" +--- + +

+ easydel +

+ +

meta-llama/Llama-3.2-1B-Instruct

+ +
+ EasyDeL checkpoint converted from meta-llama/Llama-3.2-1B-Instruct. +
+ +## Overview + +This checkpoint is intended to be loaded with EasyDeL on JAX (CPU/GPU/TPU). It supports sharded loading with `auto_shard_model=True` and configurable precision via `dtype`, `param_dtype`, and `precision`. + +## Quickstart + +```python +import easydel as ed +from jax import numpy as jnp, lax + +repo_id = "EasyDeL/Llama-3.2-1B-Instruct" + +dtype = jnp.bfloat16 # try jnp.float16 on many GPUs + +model = ed.AutoEasyDeLModelForCausalLM.from_pretrained( + repo_id, + dtype=dtype, + param_dtype=dtype, + precision=lax.Precision("fastest"), + sharding_axis_names=("dp", "fsdp", "ep", "tp", "sp"), + sharding_axis_dims=(1, -1, 1, 1, 1), + config_kwargs=ed.EasyDeLBaseConfigDict( + attn_dtype=dtype, + attn_mechanism=ed.AttentionMechanisms.VANILLA, + fsdp_is_ep_bound=True, + sp_is_ep_bound=True, + moe_method=ed.MoEMethods.FUSED_MOE, + ), + auto_shard_model=True, + partition_axis=ed.PartitionAxis(), +) +``` + +If the repository only provides PyTorch weights, pass `from_torch=True` to `from_pretrained(...)`. + +## Sharding & Parallelism (Multi-Device) + +EasyDeL can scale to multiple devices by creating a logical device mesh. Most EasyDeL loaders use a 5D mesh: + +- `dp`: data parallel (replicated parameters, different batch shards) +- `fsdp`: parameter sharding (memory saver; often the biggest axis) +- `ep`: expert parallel (MoE; keep `1` for non-MoE models) +- `tp`: tensor parallel (splits large matmuls) +- `sp`: sequence parallel (splits sequence dimension) + +Use `sharding_axis_names=("dp","fsdp","ep","tp","sp")` and choose `sharding_axis_dims` so that their product equals your device count. +You can use `-1` in `sharding_axis_dims` to let EasyDeL infer the remaining dimension. + +
+Example sharding configs + +```python +# 8 devices, pure FSDP +sharding_axis_dims = (1, 8, 1, 1, 1) + +# 8 devices, 2-way DP x 4-way FSDP +sharding_axis_dims = (2, 4, 1, 1, 1) + +# 8 devices, 4-way FSDP x 2-way TP +sharding_axis_dims = (1, 4, 1, 2, 1) +``` +
+ +## Using via `eLargeModel` (ELM) + +`eLargeModel` is a higher-level interface that wires together loading, sharding, training, and eSurge inference from a single config. + +```python +from easydel import eLargeModel + +repo_id = "EasyDeL/Llama-3.2-1B-Instruct" + +elm = eLargeModel.from_pretrained(repo_id) # task is auto-detected +elm.set_dtype("bf16") +elm.set_sharding(axis_names=("dp", "fsdp", "ep", "tp", "sp"), axis_dims=(1, -1, 1, 1, 1)) + +model = elm.build_model() +# Optional: build an inference engine +# engine = elm.build_esurge() +``` + +
+ELM YAML config example + +```yaml +model: + name_or_path: "EasyDeL/Llama-3.2-1B-Instruct" + +loader: + dtype: bf16 + param_dtype: bf16 + +sharding: + axis_dims: [1, -1, 1, 1, 1] + auto_shard_model: true +``` +
+ +## Features + +**EasyDeL:** +- JAX native implementation and sharded execution +- Configurable attention backends via `AttentionMechanisms.*` +- Precision control via `dtype`, `param_dtype`, and `precision` + +## Installation + +```bash +pip install easydel +``` + +## Links + +- EasyDeL GitHub: https://github.com/erfanzar/EasyDeL +- Docs: https://easydel.readthedocs.io/en/latest/ + +## Supported Tasks + +- CausalLM + +## Limitations + +- Refer to the original model card for training data, evaluation, and intended use. + +## License + +EasyDeL is released under the Apache-2.0 license. The license for this model's weights may differ; please consult the original repository. + +## Citation + +```bibtex +@misc{ZareChavoshi_2023, + title={EasyDeL: An open-source library for enhancing and streamlining the training process of machine learning models}, + url={https://github.com/erfanzar/EasyDeL}, + author={Zare Chavoshi, Erfan}, + year={2023} +} +``` diff --git a/chat_template.jinja b/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..1bad6a0f648dccdbec523ca79ba90fbcfc806af0 --- /dev/null +++ b/chat_template.jinja @@ -0,0 +1,93 @@ +{{- bos_token }} +{%- if custom_tools is defined %} + {%- set tools = custom_tools %} +{%- endif %} +{%- if not tools_in_user_message is defined %} + {%- set tools_in_user_message = true %} +{%- endif %} +{%- if not date_string is defined %} + {%- if strftime_now is defined %} + {%- set date_string = strftime_now("%d %b %Y") %} + {%- else %} + {%- set date_string = "26 Jul 2024" %} + {%- endif %} +{%- endif %} +{%- if not tools is defined %} + {%- set tools = none %} +{%- endif %} + +{#- This block extracts the system message, so we can slot it into the right place. 
#} +{%- if messages[0]['role'] == 'system' %} + {%- set system_message = messages[0]['content']|trim %} + {%- set messages = messages[1:] %} +{%- else %} + {%- set system_message = "" %} +{%- endif %} + +{#- System message #} +{{- "<|start_header_id|>system<|end_header_id|>\n\n" }} +{%- if tools is not none %} + {{- "Environment: ipython\n" }} +{%- endif %} +{{- "Cutting Knowledge Date: December 2023\n" }} +{{- "Today Date: " + date_string + "\n\n" }} +{%- if tools is not none and not tools_in_user_message %} + {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }} + {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }} + {{- "Do not use variables.\n\n" }} + {%- for t in tools %} + {{- t | tojson(indent=4) }} + {{- "\n\n" }} + {%- endfor %} +{%- endif %} +{{- system_message }} +{{- "<|eot_id|>" }} + +{#- Custom tools are passed in a user message with some extra guidance #} +{%- if tools_in_user_message and not tools is none %} + {#- Extract the first user message so we can plug it in here #} + {%- if messages | length != 0 %} + {%- set first_user_message = messages[0]['content']|trim %} + {%- set messages = messages[1:] %} + {%- else %} + {{- raise_exception("Cannot put tools in the first user message when there's no first user message!") }} +{%- endif %} + {{- '<|start_header_id|>user<|end_header_id|>\n\n' -}} + {{- "Given the following functions, please respond with a JSON for a function call " }} + {{- "with its proper arguments that best answers the given prompt.\n\n" }} + {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' 
}} + {{- "Do not use variables.\n\n" }} + {%- for t in tools %} + {{- t | tojson(indent=4) }} + {{- "\n\n" }} + {%- endfor %} + {{- first_user_message + "<|eot_id|>"}} +{%- endif %} + +{%- for message in messages %} + {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %} + {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' }} + {%- elif 'tool_calls' in message %} + {%- if not message.tool_calls|length == 1 %} + {{- raise_exception("This model only supports single tool-calls at once!") }} + {%- endif %} + {%- set tool_call = message.tool_calls[0].function %} + {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}} + {{- '{"name": "' + tool_call.name + '", ' }} + {{- '"parameters": ' }} + {{- tool_call.arguments | tojson }} + {{- "}" }} + {{- "<|eot_id|>" }} + {%- elif message.role == "tool" or message.role == "ipython" %} + {{- "<|start_header_id|>ipython<|end_header_id|>\n\n" }} + {%- if message.content is mapping or message.content is iterable %} + {{- message.content | tojson }} + {%- else %} + {{- message.content }} + {%- endif %} + {{- "<|eot_id|>" }} + {%- endif %} +{%- endfor %} +{%- if add_generation_prompt %} + {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }} +{%- endif %} diff --git a/checkpoint_metadata.json b/checkpoint_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..7e0256914c558a6ff4f4ebf2aad804b2d80fc974 --- /dev/null +++ b/checkpoint_metadata.json @@ -0,0 +1,6 @@ +{ + "timestamp": "2025-12-28T22:19:36.412661", + "custom_metadata": { + "step": 0 + } +} \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cda71419c1f840630e9113b727cd2eb28e5eb6e7 --- /dev/null +++ b/config.json @@ -0,0 +1,151 @@ +{ + "_external_rope_config_kwargs": {}, + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + 
"attention_dropout": 0.0, + "attn_mechanism": "vanilla", + "backend": null, + "bits": null, + "blocksize_b": 1, + "blocksize_k": 128, + "blocksize_q": 128, + "bos_token_id": 128000, + "decode_attn_mechanism": null, + "dtype": "bfloat16", + "easy_method": "train", + "embd_pdrop": 0.0, + "eos_token_id": [ + 128001, + 128008, + 128009 + ], + "fcm_max_ratio": -1, + "fcm_min_ratio": -1, + "flash_attention_backward_pass_impl": "triton", + "fsdp_is_ep_bound": true, + "gradient_checkpointing": "", + "gradient_checkpointing_targets": null, + "hardware_abstraction": false, + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "kv_cache_quantization_config": null, + "kv_cache_sharding_sequence_axis_name": "sp", + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "moe_force_xla_gmm": false, + "moe_method": "fused_moe", + "moe_tiling_size_batch": 4, + "moe_tiling_size_dim": 128, + "moe_tiling_size_seqlen": 128, + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "number_rep_kv": 1, + "operation_configs": null, + "pallas_k_block_size": 128, + "pallas_m_block_size": 128, + "pallas_n_block_size": 128, + "partition_axis": { + "attention_dim_axis": null, + "attention_kv_dim_axis": null, + "batch_axis": [ + "fsdp", + "dp" + ], + "bias_head_sequence_axis": null, + "bias_key_sequence_axis": null, + "data_parallel_axis": "dp", + "decode_attention_dim_axis": null, + "decode_attention_kv_dim_axis": null, + "decode_batch_axis": [ + "fsdp", + "dp" + ], + "decode_head_axis": "tp", + "decode_key_sequence_axis": "sp", + 
"decode_kv_head_axis": "tp", + "decode_query_sequence_axis": null, + "expert_axis": "ep", + "expert_gate_axis": null, + "expert_parallel_axis": "ep", + "fully_sharded_data_parallel_axis": "fsdp", + "head_axis": "tp", + "hidden_state_axis": "tp", + "key_sequence_axis": "sp", + "kv_head_axis": "tp", + "mlp_intermediate_axis": "tp", + "query_sequence_axis": "sp", + "sequence_axis": "sp", + "sequence_parallel_axis": "sp", + "tensor_parallel_axis": "tp", + "vocab_axis": "tp" + }, + "platform": null, + "precompute_masks": true, + "pretraining_tp": 1, + "quantization_config": null, + "resid_pdrop": 0.0, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "scan_attention_layers": false, + "scan_layers": false, + "scan_mlp_chunk_size": 1024, + "scan_ring_attention": true, + "sequence_axis_name": "sp", + "sharding_axis_dims": [ + 1, + -1, + 1, + 1, + 1 + ], + "sharding_axis_names": [ + "dp", + "fsdp", + "ep", + "tp", + "sp" + ], + "sharding_dcn_axis_dims": null, + "sp_is_ep_bound": true, + "tie_word_embeddings": true, + "transformers_version": "4.57.3", + "use_cache": true, + "use_expert_tensor_mode": false, + "use_ring_of_experts": false, + "use_scan_mlp": false, + "use_sharded_kv_caching": false, + "use_sharding_constraint": false, + "vocab_size": 128256 +} diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..053ba37d35fa3f4c31eda32128d100783a4d1fa6 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,13 @@ +{ + "bos_token_id": 128000, + "do_sample": true, + "eos_token_id": [ + 128001, + 128008, + 128009 + ], + "temperature": 0.6, + "top_p": 0.9, + "transformers_version": "4.57.3", + "trust_remote_code": false +} diff --git a/model/model/embed_tokens/embedding/.zarray b/model/model/embed_tokens/embedding/.zarray new file mode 100644 
index 0000000000000000000000000000000000000000..f1af3c8940238c5aa55c2ac7e3dc10e9f73e19e7 --- /dev/null +++ b/model/model/embed_tokens/embedding/.zarray @@ -0,0 +1 @@ +{"chunks":[32064,2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[128256,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/embed_tokens/embedding/0.0 b/model/model/embed_tokens/embedding/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..2aca44660f873eadaa4851b1befe2f7dbbfade95 --- /dev/null +++ b/model/model/embed_tokens/embedding/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ea837b38624449d8ab8c668e77176d00703925f32bb438ce913e2222694b7d0 +size 102492789 diff --git a/model/model/embed_tokens/embedding/1.0 b/model/model/embed_tokens/embedding/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..51b191a823d89d2f91b51ea85af4496465f919de --- /dev/null +++ b/model/model/embed_tokens/embedding/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ea7ed6da80a63a248ac2481e2b82b88d0a145a41c7fabc254677ca24b09c679 +size 102484784 diff --git a/model/model/embed_tokens/embedding/2.0 b/model/model/embed_tokens/embedding/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..54a3d995abb77ee7a919d206e4c91581dc082939 --- /dev/null +++ b/model/model/embed_tokens/embedding/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbca9f6c5e667388a9e6445b417032c35898a688bcf2ca123a65a21c171bae55 +size 102479657 diff --git a/model/model/embed_tokens/embedding/3.0 b/model/model/embed_tokens/embedding/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..8fea406c11f8d93a2bd0b9b45bb4ac4422cdbf97 --- /dev/null +++ b/model/model/embed_tokens/embedding/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:9a691d334486c9613e348a52dd956ed7ef644ecbe32c09c6305f4f5df54889c6 +size 101688512 diff --git a/model/model/layers/0/input_layernorm/kernel/.zarray b/model/model/layers/0/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/0/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/0/input_layernorm/kernel/0 b/model/model/layers/0/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..7c747809e6131385fabc063376ebb61a87f3ad82 Binary files /dev/null and b/model/model/layers/0/input_layernorm/kernel/0 differ diff --git a/model/model/layers/0/mlp/down_proj/kernel/.zarray b/model/model/layers/0/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..b57b49d09e50779e6e0a2e2d784feed4998dadab --- /dev/null +++ b/model/model/layers/0/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/0/mlp/down_proj/kernel/0.0 b/model/model/layers/0/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..dd12091ce836cd954a01fb9a488658d302247a6c --- /dev/null +++ b/model/model/layers/0/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d6a786d98070521e730d218d02ab9a510e3f32bb3800014e7b480f1a9bff656 +size 6527475 diff --git a/model/model/layers/0/mlp/down_proj/kernel/0.1 b/model/model/layers/0/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..e3d8abd41acb16ee8e1e900d5a5bd6cf5d6c9f62 --- /dev/null +++ b/model/model/layers/0/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7af4228604a0048ccad8da87f67951727acc054aa6e8f8973c5dd77c7b46bde0 +size 6528474 diff --git a/model/model/layers/0/mlp/down_proj/kernel/0.2 b/model/model/layers/0/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..2d35ae5518ccb5ffe307053ab8e9591c02a8cdda --- /dev/null +++ b/model/model/layers/0/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:154596ecb52b421450500626ef1bdc563dcf1420a98a62e0267d08006d365f61 +size 6526280 diff --git a/model/model/layers/0/mlp/down_proj/kernel/0.3 b/model/model/layers/0/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..071e726b61f7c78732d59c7b01baf9f6981f1e0e --- /dev/null +++ b/model/model/layers/0/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e033eed0a285e527d0aaaac87f285714c37269f3ab4615b490b0cfd81902bc0 +size 6527877 diff --git a/model/model/layers/0/mlp/gate_proj/kernel/.zarray b/model/model/layers/0/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/0/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/0/mlp/gate_proj/kernel/0.0 b/model/model/layers/0/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8e0cdf56a13c33e3ec17c191c354c7bf45005f64 --- /dev/null +++ b/model/model/layers/0/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:21b405be1611368b2f7f889e59b732ff785be445e4c9ccead5f9057cfe3a19c9 +size 6538934 diff --git a/model/model/layers/0/mlp/gate_proj/kernel/1.0 b/model/model/layers/0/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..9ca4e50897894028bcf09c5283749764ab6ee383 --- /dev/null +++ b/model/model/layers/0/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ac49d8d1c7bb012db9efd933884fc43c6ed80d378e65e51e120f209f17faaf8 +size 6536157 diff --git a/model/model/layers/0/mlp/gate_proj/kernel/2.0 b/model/model/layers/0/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..ed2f98b2b3bafbb91fc00496ff21b2435e358c56 --- /dev/null +++ b/model/model/layers/0/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cdcabf5db44daca65844a808368306eaec12f04b0813c02d5aa482895c8783b +size 6539230 diff --git a/model/model/layers/0/mlp/gate_proj/kernel/3.0 b/model/model/layers/0/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..a08a4064012558ee0104f53806fe7b0957f017ec --- /dev/null +++ b/model/model/layers/0/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78b0e654c953a1252780595e72015df465beb137bb455470d62600879b701ab2 +size 6539301 diff --git a/model/model/layers/0/mlp/up_proj/kernel/.zarray b/model/model/layers/0/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/0/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/0/mlp/up_proj/kernel/0.0 b/model/model/layers/0/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8e4538e2632fcffde0aeb8f19822caf10bd8f11e --- /dev/null +++ b/model/model/layers/0/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02bef30fbbae495ea9023edcf1e664187fd7ed8f082897bb07a8a976f8279f90 +size 6529491 diff --git a/model/model/layers/0/mlp/up_proj/kernel/1.0 b/model/model/layers/0/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..281b6ea403d604bb3ebf46188cbb1dcde8ff98d9 --- /dev/null +++ b/model/model/layers/0/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3df9f3b7ac315d43b19fa301151aea24f39be17b127e1d42605778bbe4b9c782 +size 6526459 diff --git a/model/model/layers/0/mlp/up_proj/kernel/2.0 b/model/model/layers/0/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..5760aa8c3afcd833bf510d6434003d7a5d78874c --- /dev/null +++ b/model/model/layers/0/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe13b34c095a68ed3ca264d915a038cb004703cf9ed41c1dba49430c97665334 +size 6528775 diff --git a/model/model/layers/0/mlp/up_proj/kernel/3.0 b/model/model/layers/0/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..8d4f2351727420d9941d4442cc7700eff8cdc4f4 --- /dev/null +++ b/model/model/layers/0/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:affeca4f12b92a702938164e824368427b2b75fb1aea3e132858ef9d047ebd33 +size 6530095 diff --git a/model/model/layers/0/post_attention_layernorm/kernel/.zarray b/model/model/layers/0/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ 
b/model/model/layers/0/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/0/post_attention_layernorm/kernel/0 b/model/model/layers/0/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..f62a825c65f3e53cefbbef607d73298f3590a8ca Binary files /dev/null and b/model/model/layers/0/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/0/self_attn/k_proj/kernel/.zarray b/model/model/layers/0/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/0/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/0/self_attn/k_proj/kernel/0.0 b/model/model/layers/0/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e7af31503ddd126c2b4902235d7f703f4dd49a00 --- /dev/null +++ b/model/model/layers/0/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87e1dc807c3d4bc782822200a7f86cc621324d2d7a21d2db2f1f6e9ee55da179 +size 414402 diff --git a/model/model/layers/0/self_attn/k_proj/kernel/1.0 b/model/model/layers/0/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..e200efd545b33c864203d17492242dfdad889ec6 --- /dev/null +++ b/model/model/layers/0/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:c1e33ea14570cb6a35fa6005b9209dddf060c08d043e3ef61222a8ead6ecbde7 +size 414730 diff --git a/model/model/layers/0/self_attn/k_proj/kernel/2.0 b/model/model/layers/0/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..7d6929f4169651f4ca5089ab38d200b4980fe755 --- /dev/null +++ b/model/model/layers/0/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1210968776a4ac9f29c715939344d6fdd1bc2203412a24211bacf1c8e9cf55b6 +size 415025 diff --git a/model/model/layers/0/self_attn/k_proj/kernel/3.0 b/model/model/layers/0/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6f17ca303ef83c43830bd2cba007177e0a9767cb --- /dev/null +++ b/model/model/layers/0/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e24f82d8850f260b0774b46407cf9dab147a6c8771016426baad44caf67482b +size 414790 diff --git a/model/model/layers/0/self_attn/o_proj/kernel/.zarray b/model/model/layers/0/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..1f43215c04ea8738b5721bed11256b14599d4e36 --- /dev/null +++ b/model/model/layers/0/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/0/self_attn/o_proj/kernel/0.0 b/model/model/layers/0/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..afc93177a86b63f63b55ce09e618d473a4507422 --- /dev/null +++ b/model/model/layers/0/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0597eb782a53d6aa632d27f0516292551b505910d46137a9c43fe347f3318ceb +size 1640502 diff --git 
a/model/model/layers/0/self_attn/o_proj/kernel/0.1 b/model/model/layers/0/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..98da736ce0a3c80def8b03614405f92e74e0af2e --- /dev/null +++ b/model/model/layers/0/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55c4e61602a7f16064a205ae526a7f71fc4beae692db92a009593c41bc79b2e0 +size 1639848 diff --git a/model/model/layers/0/self_attn/o_proj/kernel/0.2 b/model/model/layers/0/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..37699def82724543218b3b819652fc332e37021d --- /dev/null +++ b/model/model/layers/0/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23f5810937dcc2a929f3a01ea51010dc40fa264d3e01f378f1c8a9d7eb61b852 +size 1640166 diff --git a/model/model/layers/0/self_attn/o_proj/kernel/0.3 b/model/model/layers/0/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..50ccde26fbcd186cfd69e14aefa73247e3d532e6 --- /dev/null +++ b/model/model/layers/0/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c92f1849f8664e3030868f71bd315e66ad3539b0e9c0ce673d4ec2fbd81d1e7a +size 1640754 diff --git a/model/model/layers/0/self_attn/q_proj/kernel/.zarray b/model/model/layers/0/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..059f1aabbdc9e18d982e2db50174668264fc96e4 --- /dev/null +++ b/model/model/layers/0/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/0/self_attn/q_proj/kernel/0.0 b/model/model/layers/0/self_attn/q_proj/kernel/0.0 new file mode 100644 index 
0000000000000000000000000000000000000000..25b6fde339ec08846b15c35134269b2f55cb261e --- /dev/null +++ b/model/model/layers/0/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46ab7d3932f1aa9567c15aec0eb8ac8d6e7dc646a6a1ff24617eefdbd23ce5f8 +size 1657678 diff --git a/model/model/layers/0/self_attn/q_proj/kernel/1.0 b/model/model/layers/0/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..c275155c1dbc4927cd5e9ac48db9e6bf358bd049 --- /dev/null +++ b/model/model/layers/0/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62aa6fadaf4a3d404d814e283e42ee3c32dd3084a0180f9664bedea574b06f57 +size 1659813 diff --git a/model/model/layers/0/self_attn/q_proj/kernel/2.0 b/model/model/layers/0/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..ad6ff43441a7492760a79628cc6fd0a5119324dd --- /dev/null +++ b/model/model/layers/0/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04b4696d98a01c707cafe7aec0652331b9e5ebd4299afcde9d68d0e432deff61 +size 1660245 diff --git a/model/model/layers/0/self_attn/q_proj/kernel/3.0 b/model/model/layers/0/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..d23ff6c6a39b5ef75cb9a9f855c490d18cf10d33 --- /dev/null +++ b/model/model/layers/0/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58757a51a3cd976f00417957d1f0820225c56d57235d9d0b16c69d8091340b2a +size 1658737 diff --git a/model/model/layers/0/self_attn/v_proj/kernel/.zarray b/model/model/layers/0/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/0/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/0/self_attn/v_proj/kernel/0.0 b/model/model/layers/0/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..cc015ca0915905b07bfdaa3db553f885fc9d3b9a --- /dev/null +++ b/model/model/layers/0/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf0b896e9cda0219ec8e0eda3bea0ec559f601eb43f69de45fd136ccd7b5edc7 +size 414432 diff --git a/model/model/layers/0/self_attn/v_proj/kernel/1.0 b/model/model/layers/0/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..f3a67ae069e70ac8b53077474ae23e0e27860805 --- /dev/null +++ b/model/model/layers/0/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f93ad4937ab7a65785916562c133808c80436feff8fcb1241f687b0adc01b740 +size 414974 diff --git a/model/model/layers/0/self_attn/v_proj/kernel/2.0 b/model/model/layers/0/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..dc280a643745b1f1e1ec246f42c963fed02a195f --- /dev/null +++ b/model/model/layers/0/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4d6a45031b3b43db3d940b1bbcc37cfffde8b2078db5031be6676ee832abe11 +size 414881 diff --git a/model/model/layers/0/self_attn/v_proj/kernel/3.0 b/model/model/layers/0/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..e6f961e4ffd95e2b993903fad19a3931f7702ca6 --- /dev/null +++ b/model/model/layers/0/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25d5d34a6a13b2e719073ecafa48558f8572aeb832d6c9cb6559358f5ffa549a +size 414444 diff --git 
a/model/model/layers/1/input_layernorm/kernel/.zarray b/model/model/layers/1/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/1/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/1/input_layernorm/kernel/0 b/model/model/layers/1/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..ba0a71401e065972e78ff4ed72da7b28799393ad Binary files /dev/null and b/model/model/layers/1/input_layernorm/kernel/0 differ diff --git a/model/model/layers/1/mlp/down_proj/kernel/.zarray b/model/model/layers/1/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..b57b49d09e50779e6e0a2e2d784feed4998dadab --- /dev/null +++ b/model/model/layers/1/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/1/mlp/down_proj/kernel/0.0 b/model/model/layers/1/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a31aae073242b3a81b288ed6df8fa003f5ad7bb3 --- /dev/null +++ b/model/model/layers/1/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a8efad2ea7c423e2c7b09985b2409828a13bf02c004e844ba9701c0c5ebe8fd +size 6528555 diff --git a/model/model/layers/1/mlp/down_proj/kernel/0.1 b/model/model/layers/1/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..ce825c6c5dc7fd68594bb566e96bf7a0dc491241 --- /dev/null +++ 
b/model/model/layers/1/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0c35ebb3e83db526392d889db12380e68a0150a64dd69f4262a95609006f907 +size 6529395 diff --git a/model/model/layers/1/mlp/down_proj/kernel/0.2 b/model/model/layers/1/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..d1decc2a5723d0f68959fb0a3a70c6b54c7ed95f --- /dev/null +++ b/model/model/layers/1/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d3936fe4345121f3953635575b3edfad9b21d3916705b1a6798e893ae70e099 +size 6528558 diff --git a/model/model/layers/1/mlp/down_proj/kernel/0.3 b/model/model/layers/1/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..e28eb20a7e0a4123a4291c1c6346fd3eced98ce1 --- /dev/null +++ b/model/model/layers/1/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:320679c5c031be8bde05aff4f7192b15e1b1ba51e1e204e9c74c8f248dd389fe +size 6530015 diff --git a/model/model/layers/1/mlp/gate_proj/kernel/.zarray b/model/model/layers/1/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/1/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/1/mlp/gate_proj/kernel/0.0 b/model/model/layers/1/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..fcbe12550df4d919d2d0429a4201b4f719bee031 --- /dev/null +++ b/model/model/layers/1/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:163a6080749b48e290f679dea858f134e8005bdf4c4a5fa27f369836b7db480f +size 6546362 diff --git a/model/model/layers/1/mlp/gate_proj/kernel/1.0 b/model/model/layers/1/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..c32ec220488cfe0aaed0c03344f18ab8b3af8e64 --- /dev/null +++ b/model/model/layers/1/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f85592ef117d97b8fdae6da883deeb435c15b2f00c2e33b6662df2c5aa46c2ea +size 6544928 diff --git a/model/model/layers/1/mlp/gate_proj/kernel/2.0 b/model/model/layers/1/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..1b2f9fc346a1e9f06d189a5e404fcbeea7242e49 --- /dev/null +++ b/model/model/layers/1/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e61ed6b2cd608b54f91b8819722951c20861da59117dfcb08e6585badfe461e8 +size 6546641 diff --git a/model/model/layers/1/mlp/gate_proj/kernel/3.0 b/model/model/layers/1/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..15a7070be27643968f985eb5082b50a73a13ed6a --- /dev/null +++ b/model/model/layers/1/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20e356a8aa890ee5ab10f5ffd20a52a828f259b2e364d40dec3401f7d5f9f617 +size 6546440 diff --git a/model/model/layers/1/mlp/up_proj/kernel/.zarray b/model/model/layers/1/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/1/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/1/mlp/up_proj/kernel/0.0 
b/model/model/layers/1/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..b5e25db917fa43f93290d6960dd3aa9847805041 --- /dev/null +++ b/model/model/layers/1/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23513be0ccd58a5ef064b1ee03c87e1a68ccbc982f01fd689d1f8f6a84ec9a4d +size 6530222 diff --git a/model/model/layers/1/mlp/up_proj/kernel/1.0 b/model/model/layers/1/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..24629267ea0fd5c4f3cbb53aa4bc789488bc9325 --- /dev/null +++ b/model/model/layers/1/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8b8a15307a468b1549d944dbf284ee5db1fa775bd49f2fe3d03d7244cd901bd +size 6528567 diff --git a/model/model/layers/1/mlp/up_proj/kernel/2.0 b/model/model/layers/1/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..1ae3fa7f80731d6dea44d2f1aae33c39202ba599 --- /dev/null +++ b/model/model/layers/1/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f79ad90ff64b9d21d7f9ba1de44ecbfbd0a7347a866a30bcfb752f226e667f +size 6530437 diff --git a/model/model/layers/1/mlp/up_proj/kernel/3.0 b/model/model/layers/1/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..8cad904ea61f4d0f1b12e26740753d0379da6321 --- /dev/null +++ b/model/model/layers/1/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a80491bba3d5e7b9bac94395762770f1da795efb8ebe8618a03c6a9fcdf2ea8a +size 6530924 diff --git a/model/model/layers/1/post_attention_layernorm/kernel/.zarray b/model/model/layers/1/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/1/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/1/post_attention_layernorm/kernel/0 b/model/model/layers/1/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..ab534ce687b55e4cf1f9e60960bd92ec7d387e97 Binary files /dev/null and b/model/model/layers/1/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/1/self_attn/k_proj/kernel/.zarray b/model/model/layers/1/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/1/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/1/self_attn/k_proj/kernel/0.0 b/model/model/layers/1/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8437f6484faca4518819e1dff1dbf8d98e3801d2 --- /dev/null +++ b/model/model/layers/1/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad7db6baf000337b8471832617f7dbc0032b033160c5f9bd4821ea98da3bdd76 +size 412386 diff --git a/model/model/layers/1/self_attn/k_proj/kernel/1.0 b/model/model/layers/1/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..bc39749a42c882cf195444d69901b85c34a5bd10 --- /dev/null +++ b/model/model/layers/1/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:218840247e6c71c4adca4a21d8d17a8c614c21f4db234c46c20fab4f00c777ce +size 412593 diff --git 
a/model/model/layers/1/self_attn/k_proj/kernel/2.0 b/model/model/layers/1/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..dd566c1b22e655a99ff033ae72268aa93998aa6a --- /dev/null +++ b/model/model/layers/1/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddac4762250921c4a4be968d62a11d52d313432f4a36f82775dac7cc172100b5 +size 412485 diff --git a/model/model/layers/1/self_attn/k_proj/kernel/3.0 b/model/model/layers/1/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..2f443b375e36cc53caa659d0efa091802df3317d --- /dev/null +++ b/model/model/layers/1/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d869fc32e190d121c64e32985a78a6585ea44fcd149455fd324a6926679c0fa3 +size 412311 diff --git a/model/model/layers/1/self_attn/o_proj/kernel/.zarray b/model/model/layers/1/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..1f43215c04ea8738b5721bed11256b14599d4e36 --- /dev/null +++ b/model/model/layers/1/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/1/self_attn/o_proj/kernel/0.0 b/model/model/layers/1/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..3bc8cf67d2317727f911d1551762df9ddc77dc4c --- /dev/null +++ b/model/model/layers/1/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e57d0deafeeb35fcd1108648d91519f55a5f6d288eb92a77464e8d777bd2748 +size 1636014 diff --git a/model/model/layers/1/self_attn/o_proj/kernel/0.1 b/model/model/layers/1/self_attn/o_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..5a2dee247ae4a30ba952c92c76db4c90d760b797 --- /dev/null +++ b/model/model/layers/1/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb90fc3bdf5dced722ca0e78c2260a2ceaab0aaefca0861030b643be3d2d85ce +size 1635891 diff --git a/model/model/layers/1/self_attn/o_proj/kernel/0.2 b/model/model/layers/1/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..7e5ac573c2c061f36b18587e2d7c166e5fff0ee6 --- /dev/null +++ b/model/model/layers/1/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d2acc0d556d2b3ac02d9f771f4a6aae9e7a3fb18bfc099d9eccef0e1e3bbd7c +size 1635296 diff --git a/model/model/layers/1/self_attn/o_proj/kernel/0.3 b/model/model/layers/1/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..5d73dd7897d00dec62459bc3c773bacfa65b7372 --- /dev/null +++ b/model/model/layers/1/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2782e9e93b9de4a7921f67795624f914a6cf04399e62bcd48aec97da16b3d7b3 +size 1636787 diff --git a/model/model/layers/1/self_attn/q_proj/kernel/.zarray b/model/model/layers/1/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..059f1aabbdc9e18d982e2db50174668264fc96e4 --- /dev/null +++ b/model/model/layers/1/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/1/self_attn/q_proj/kernel/0.0 b/model/model/layers/1/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..bd99c5c96574e2fd594c7f4ff0ee2dbb52f53c59 --- /dev/null +++ 
b/model/model/layers/1/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c87e20808137c2821f184e4205f02c21d1eba8c44cd69e76dab34bc91565f43 +size 1650776 diff --git a/model/model/layers/1/self_attn/q_proj/kernel/1.0 b/model/model/layers/1/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..5a8da709730ad4d6b8049440a19c2f66eba00ac6 --- /dev/null +++ b/model/model/layers/1/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd662e3062a8032919b3c04411ed6c9cff48ea83bf126286b8d05696fac05e60 +size 1653889 diff --git a/model/model/layers/1/self_attn/q_proj/kernel/2.0 b/model/model/layers/1/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..e98195f564ed713c0432e7b6c545abb5198bb57b --- /dev/null +++ b/model/model/layers/1/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df3b51a53c00346727f454fa226c7fee139092fbd9824c8b4c3c7cb5d3b391be +size 1653097 diff --git a/model/model/layers/1/self_attn/q_proj/kernel/3.0 b/model/model/layers/1/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..1a4285b5e85d940a0a079baf67cb117eba9e676a --- /dev/null +++ b/model/model/layers/1/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30c6eb51821ad9f4b5c7ac5b2acb8d167de5c7ecc7e8b5e946f1289c3866b7b5 +size 1651822 diff --git a/model/model/layers/1/self_attn/v_proj/kernel/.zarray b/model/model/layers/1/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/1/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/1/self_attn/v_proj/kernel/0.0 b/model/model/layers/1/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..9200ded32685fa8ad5b2e8c02c2ea30b7362be2a --- /dev/null +++ b/model/model/layers/1/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:412c61fc49b03a0ef91df713eecc66f4e91d7e20e644dd0d2819d6dc20a91a06 +size 411340 diff --git a/model/model/layers/1/self_attn/v_proj/kernel/1.0 b/model/model/layers/1/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..1874fccd294bf0315332d3f76cc7099e284f0d03 --- /dev/null +++ b/model/model/layers/1/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ef8c53b245e8fdc37ba97787febe0380d04cf292d74c195c9ba496654a7096a +size 411919 diff --git a/model/model/layers/1/self_attn/v_proj/kernel/2.0 b/model/model/layers/1/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..784317eb42e0fde1ab3ddcb4e2e655b63a88d4fc --- /dev/null +++ b/model/model/layers/1/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64f7aebbb96f392fe8ec69d3a3cc4ccf36c72abf112c8cc607203ab6fe7647a2 +size 411843 diff --git a/model/model/layers/1/self_attn/v_proj/kernel/3.0 b/model/model/layers/1/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..f169e1354a2971c1dd53d8f73ee61975ecae7b2e --- /dev/null +++ b/model/model/layers/1/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b79dd1c73e9806309bd17d0fcc611cdac7dc4f6121876a476106448964cc25 +size 411765 diff --git 
a/model/model/layers/10/input_layernorm/kernel/.zarray b/model/model/layers/10/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/10/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/input_layernorm/kernel/0 b/model/model/layers/10/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..00fe9bde12e5107bde6990f327daf41a1c7c1c36 Binary files /dev/null and b/model/model/layers/10/input_layernorm/kernel/0 differ diff --git a/model/model/layers/10/mlp/down_proj/kernel/.zarray b/model/model/layers/10/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..b57b49d09e50779e6e0a2e2d784feed4998dadab --- /dev/null +++ b/model/model/layers/10/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/mlp/down_proj/kernel/0.0 b/model/model/layers/10/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..2154ddd86979210f6aad3b9de0d1707457350051 --- /dev/null +++ b/model/model/layers/10/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1ca14976f02348afc55ffefec3c3eb20c40985e00335f0a20fc973535b37c15 +size 6532658 diff --git a/model/model/layers/10/mlp/down_proj/kernel/0.1 b/model/model/layers/10/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..61b9886000d62fe2642eca83750c780650521347 --- 
/dev/null +++ b/model/model/layers/10/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6f622da84d24835f82a7712eda03743618f66d0c3a040d158da51b3894037cc +size 6533073 diff --git a/model/model/layers/10/mlp/down_proj/kernel/0.2 b/model/model/layers/10/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..cc6d9242db46142202ff6e53de398327f4b53fb4 --- /dev/null +++ b/model/model/layers/10/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8219903bb5079c0ace6833f625968b078394367bd2d7e70c4750fbe46d23a418 +size 6531758 diff --git a/model/model/layers/10/mlp/down_proj/kernel/0.3 b/model/model/layers/10/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..63544bb32337e060b2d48b1645e6db07ac59c3d0 --- /dev/null +++ b/model/model/layers/10/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5aada0b505f268dad89b2eee5fbcf0ad43df44fe6be2d5f29bb68e8e8ff7060 +size 6533720 diff --git a/model/model/layers/10/mlp/gate_proj/kernel/.zarray b/model/model/layers/10/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/10/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/mlp/gate_proj/kernel/0.0 b/model/model/layers/10/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..96414bcd73b85aace251a009844b9118ee7d1444 --- /dev/null +++ b/model/model/layers/10/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:bad8a162f63ff1a7e8dbeb96b62f1a1d839534054ae8eaf325f2d911ba0b698b +size 6561608 diff --git a/model/model/layers/10/mlp/gate_proj/kernel/1.0 b/model/model/layers/10/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..e452206cfa2e58291102538b98fdec79d5055818 --- /dev/null +++ b/model/model/layers/10/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78fa482004390407a4d74103988e7add9b2cc435f2db7296bf15cc4e6367e2db +size 6561466 diff --git a/model/model/layers/10/mlp/gate_proj/kernel/2.0 b/model/model/layers/10/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..94fae9987c1bcbb5ceb14a13164d85b28e1c06f4 --- /dev/null +++ b/model/model/layers/10/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d4650c38229b3ccd20639494ef1562e7c8684e862e114584414a2a1fca36c4c +size 6561467 diff --git a/model/model/layers/10/mlp/gate_proj/kernel/3.0 b/model/model/layers/10/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..9b0d7c61232b94a46f4e4c49523b5dc1ce4d113a --- /dev/null +++ b/model/model/layers/10/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e456c8a0b358e1a4bedcf7e1e241407ddae6ee88b8bb358bb5b294e73c821098 +size 6562179 diff --git a/model/model/layers/10/mlp/up_proj/kernel/.zarray b/model/model/layers/10/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/10/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/mlp/up_proj/kernel/0.0 
b/model/model/layers/10/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..3ea816524fa2ae44d566938bde07ac6b83faa4b3 --- /dev/null +++ b/model/model/layers/10/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fb05468d7c1547d0df8aba690a40c7fb9fde3c91cbc6f1a075270d7e9f209e6 +size 6534413 diff --git a/model/model/layers/10/mlp/up_proj/kernel/1.0 b/model/model/layers/10/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..5b06e011e8463fb89f054ac704a7539d41ae6eaa --- /dev/null +++ b/model/model/layers/10/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93d02140bc303294044f498ed79f4e1ee01bb0f871594a18de20ee43d477014a +size 6535020 diff --git a/model/model/layers/10/mlp/up_proj/kernel/2.0 b/model/model/layers/10/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..8c695d8a8eb1b495a1bdea41358ae45901ebc14b --- /dev/null +++ b/model/model/layers/10/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a60d3515aebbcd8ebd0a903d429ac2261cb395d7e0638f8ed181b8d701406a0 +size 6534077 diff --git a/model/model/layers/10/mlp/up_proj/kernel/3.0 b/model/model/layers/10/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..697d0765c9249c81ecc3a7b20a41d92935421480 --- /dev/null +++ b/model/model/layers/10/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb34b666852400441ec110b71292be1de4fc69f9ef13710240d4a3ae2430e39b +size 6533543 diff --git a/model/model/layers/10/post_attention_layernorm/kernel/.zarray b/model/model/layers/10/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/10/post_attention_layernorm/kernel/.zarray @@ 
-0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/post_attention_layernorm/kernel/0 b/model/model/layers/10/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..e48ab77a1b98a2cd7666aa1e25efe125bc97165b Binary files /dev/null and b/model/model/layers/10/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/10/self_attn/k_proj/kernel/.zarray b/model/model/layers/10/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/10/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/self_attn/k_proj/kernel/0.0 b/model/model/layers/10/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..696e2b2828dd308ae8220989aa258a67029fe3db --- /dev/null +++ b/model/model/layers/10/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4027befbfa48405c95403519b0c450aad0205481d969e55064d29dd710826bb6 +size 411327 diff --git a/model/model/layers/10/self_attn/k_proj/kernel/1.0 b/model/model/layers/10/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..03e8b66149cd9d0cc7c9db962604665eace248c3 --- /dev/null +++ b/model/model/layers/10/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c18553f171f77e8bbdb8e64d33d609c1406def62b56d5452eba188df0b1d964 +size 411349 diff --git 
a/model/model/layers/10/self_attn/k_proj/kernel/2.0 b/model/model/layers/10/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..573e2d4a1c1c813e6eefa352e7750a516369f251 --- /dev/null +++ b/model/model/layers/10/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:051f364cfba430d085dbcdcf6f6b9bc7c4c924bf1a1c64717860c0dbf4406c68 +size 411351 diff --git a/model/model/layers/10/self_attn/k_proj/kernel/3.0 b/model/model/layers/10/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..e51f698af58976018138109f9a776785c54c6de1 --- /dev/null +++ b/model/model/layers/10/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee4261c1e1c5de541cbbda28664c7c0938d0c70b8b1d669bb7f3c9ae531d9051 +size 411282 diff --git a/model/model/layers/10/self_attn/o_proj/kernel/.zarray b/model/model/layers/10/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..1f43215c04ea8738b5721bed11256b14599d4e36 --- /dev/null +++ b/model/model/layers/10/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/self_attn/o_proj/kernel/0.0 b/model/model/layers/10/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..446417a9d4324d6d09ba5e7087831eb3d6ca5ec3 --- /dev/null +++ b/model/model/layers/10/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c39c231350f86311dc81e1699e0b17489214879b884e211ef09f9361dd76f093 +size 1635163 diff --git a/model/model/layers/10/self_attn/o_proj/kernel/0.1 b/model/model/layers/10/self_attn/o_proj/kernel/0.1 new file mode 100644 
index 0000000000000000000000000000000000000000..96b1878e0980e647d764c18ac59469f8c8530e3d --- /dev/null +++ b/model/model/layers/10/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b41ff8b07160df9dfb42f25cc2283892e328767d6c5e31db5fe6cec2fa3c94b +size 1635072 diff --git a/model/model/layers/10/self_attn/o_proj/kernel/0.2 b/model/model/layers/10/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..49015cd0ae2cf7af5d870ccccf39cc873b6b108c --- /dev/null +++ b/model/model/layers/10/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32221919ecd3a1370eaec73499c2b8750905710a3abd1e248422dbce486fed00 +size 1634542 diff --git a/model/model/layers/10/self_attn/o_proj/kernel/0.3 b/model/model/layers/10/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..ab85eb9c6f259d2ac94653a9066c2c92c81416b9 --- /dev/null +++ b/model/model/layers/10/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a5ae3557d504d038a30a4584a784615bc1dd93234dc7870fd0dcb4066982cfd +size 1634847 diff --git a/model/model/layers/10/self_attn/q_proj/kernel/.zarray b/model/model/layers/10/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..059f1aabbdc9e18d982e2db50174668264fc96e4 --- /dev/null +++ b/model/model/layers/10/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/self_attn/q_proj/kernel/0.0 b/model/model/layers/10/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..d80c1c81b6029793a9273ec8a7042426af93386a --- /dev/null +++ 
b/model/model/layers/10/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42c37391cb75c31d2cc4ee8d673695b9baf5a76c21bfc23a9b2e9bbf31617308 +size 1655572 diff --git a/model/model/layers/10/self_attn/q_proj/kernel/1.0 b/model/model/layers/10/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..38de3e110967ec6bfe8f0a8d36155331241f2324 --- /dev/null +++ b/model/model/layers/10/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bce80c023376617ba6ef40bb62e35f768c0cf25b0e803de4446c20c57159537 +size 1655431 diff --git a/model/model/layers/10/self_attn/q_proj/kernel/2.0 b/model/model/layers/10/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..1bff31409e3426326c2c9f5d391972cb057f5491 --- /dev/null +++ b/model/model/layers/10/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:828352640a13d74210d3379eeccacb680772eaf280ae0ab4e9b331407af1372f +size 1654785 diff --git a/model/model/layers/10/self_attn/q_proj/kernel/3.0 b/model/model/layers/10/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..c355876455fc44442a922335d48ae0ec8832cf4b --- /dev/null +++ b/model/model/layers/10/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a6c0c3daaa08c6ec753e757d093f36f78b76d7c9b888192add456d9b556219a +size 1654791 diff --git a/model/model/layers/10/self_attn/v_proj/kernel/.zarray b/model/model/layers/10/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/10/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/10/self_attn/v_proj/kernel/0.0 b/model/model/layers/10/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..2baec206f1d75b78393f2c47feabf993b6eb3985 --- /dev/null +++ b/model/model/layers/10/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9800ef970c6b57291560d4f5b3f01f938a557050432cfb607633452d42fad086 +size 409962 diff --git a/model/model/layers/10/self_attn/v_proj/kernel/1.0 b/model/model/layers/10/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..31f4378799072220644e91c970a85b09be4cff84 --- /dev/null +++ b/model/model/layers/10/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:359248cf051bb550c98552904ee138fbcb242ca741eadcd328e383b9b9d56c76 +size 409962 diff --git a/model/model/layers/10/self_attn/v_proj/kernel/2.0 b/model/model/layers/10/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..90cd2b481e52b6d9d8895611a8d10b2e2a840b38 --- /dev/null +++ b/model/model/layers/10/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f89493ff3be4f2b3ce92786c107eca9dc9e4889da627ab3040fa7c9c99f9da8 +size 409900 diff --git a/model/model/layers/10/self_attn/v_proj/kernel/3.0 b/model/model/layers/10/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..e7eaa879b1373720db09b9d3f8c111ffa839b5ab --- /dev/null +++ b/model/model/layers/10/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87fcf588c140afb1af9dcf6fa35ab93c226d27e7de328744d923f76f1ea1352f +size 409801 diff 
--git a/model/model/layers/11/input_layernorm/kernel/.zarray b/model/model/layers/11/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/11/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/11/input_layernorm/kernel/0 b/model/model/layers/11/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..975638d713521b6b0c960cfb42f0fe838d72596c Binary files /dev/null and b/model/model/layers/11/input_layernorm/kernel/0 differ diff --git a/model/model/layers/11/mlp/down_proj/kernel/.zarray b/model/model/layers/11/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..b57b49d09e50779e6e0a2e2d784feed4998dadab --- /dev/null +++ b/model/model/layers/11/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/11/mlp/down_proj/kernel/0.0 b/model/model/layers/11/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..0bd30cf1e26580ff4a940cdf63d5af68c3255bc5 --- /dev/null +++ b/model/model/layers/11/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3d024a302ba3ceaa05fd38bd97d4a0248b13c56be363ab35bdddbeba437f4cc +size 6534529 diff --git a/model/model/layers/11/mlp/down_proj/kernel/0.1 b/model/model/layers/11/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..31d1bf5c96d19d024e587e1dd40afff87dacb429 --- /dev/null +++ b/model/model/layers/11/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd14adc7e25d8305142cc2faa16cb5dd2232d35d367ede3a2994f0d1a9d01eb2 +size 6535899 diff --git a/model/model/layers/11/mlp/down_proj/kernel/0.2 b/model/model/layers/11/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..739cd5dba093775245eb6f83ed4a28aae476ee71 --- /dev/null +++ b/model/model/layers/11/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:213cd5842a3428bf011a109f9a750d7c6c7ed5017bb94107d0a836f7ed4d9ed0 +size 6534975 diff --git a/model/model/layers/11/mlp/down_proj/kernel/0.3 b/model/model/layers/11/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..ce7bb50faafdb4fa79e7faefd885102d40fcedb9 --- /dev/null +++ b/model/model/layers/11/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0b7234e165325009a6e87171da53e68f4301e239ff70c01cdd4c189a73478da +size 6535683 diff --git a/model/model/layers/11/mlp/gate_proj/kernel/.zarray b/model/model/layers/11/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/11/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/11/mlp/gate_proj/kernel/0.0 b/model/model/layers/11/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..bce338b293dbb7e3da508c6b6a85f1bdcb0e2f5a --- /dev/null +++ b/model/model/layers/11/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:364cc7a0cb3d5de3317fec8f40d2ddeb611a3a84d457e7c771481cc30d22801a +size 6557184 diff --git a/model/model/layers/11/mlp/gate_proj/kernel/1.0 b/model/model/layers/11/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..b9ff837c9f0237ffbe12c09bb3c3e878bd7db1de --- /dev/null +++ b/model/model/layers/11/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebe61a0c27f3c0e2150363a5de6b0095982171120d3671a5eea5ff02919c7781 +size 6557351 diff --git a/model/model/layers/11/mlp/gate_proj/kernel/2.0 b/model/model/layers/11/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..5250109fff54e2fc4e1651bff050068b80fcd6b3 --- /dev/null +++ b/model/model/layers/11/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5e7c97488cc98cfa455f671336347390e7ac9f63cd0a1f204df0553a442fc9a +size 6557524 diff --git a/model/model/layers/11/mlp/gate_proj/kernel/3.0 b/model/model/layers/11/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..21e88a727100b9ad078f231135a0709078a3e067 --- /dev/null +++ b/model/model/layers/11/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e36960a661d81e5338c5ec31e0a9b0aecf9773d68ec59020cb64d58843bc43c +size 6557192 diff --git a/model/model/layers/11/mlp/up_proj/kernel/.zarray b/model/model/layers/11/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/11/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/11/mlp/up_proj/kernel/0.0 b/model/model/layers/11/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c931b92036087abf5b1a1637556ed873fb2d4f27 --- /dev/null +++ b/model/model/layers/11/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db188f2fdcded0bc4dc9ea27ec00d5530dc931e20d9da2a490c61a67dead1e52 +size 6533248 diff --git a/model/model/layers/11/mlp/up_proj/kernel/1.0 b/model/model/layers/11/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..bf23f533993ec5c695b7952d6cf59d16079c3798 --- /dev/null +++ b/model/model/layers/11/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89f251a3720a2c6e1f3a8cb76496d533bfea016794726caa3c43d431c34e0833 +size 6533213 diff --git a/model/model/layers/11/mlp/up_proj/kernel/2.0 b/model/model/layers/11/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..71172d88d4a281e3d2796bfaa663c2c4bd1b1c41 --- /dev/null +++ b/model/model/layers/11/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4acbcf3b323ce61fb2873563d82098a748d73884a60ae859cc36049b6bf0228 +size 6531957 diff --git a/model/model/layers/11/mlp/up_proj/kernel/3.0 b/model/model/layers/11/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..88b2771aa2b7f7e3545e4ea4a057951f23f2447e --- /dev/null +++ b/model/model/layers/11/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21d4f2bb3052c459628070e69c89ad01bdbeeba81a200655d153a22428f627ef +size 6533207 diff --git a/model/model/layers/11/post_attention_layernorm/kernel/.zarray b/model/model/layers/11/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ 
b/model/model/layers/11/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/11/post_attention_layernorm/kernel/0 b/model/model/layers/11/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..abe9ae4d27f3be030b253af166e7da85cc4e9c6d Binary files /dev/null and b/model/model/layers/11/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/11/self_attn/k_proj/kernel/.zarray b/model/model/layers/11/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/11/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/11/self_attn/k_proj/kernel/0.0 b/model/model/layers/11/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..523538c799bd5bde1b552d6298934279e806ec1c --- /dev/null +++ b/model/model/layers/11/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bdd1edf3d1542f009e222720ce0c58bf0e2f12923ab151ba06176d2125f55ad +size 411155 diff --git a/model/model/layers/11/self_attn/k_proj/kernel/1.0 b/model/model/layers/11/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..66fd2dd38244bda613de58e5b40511368ed671cd --- /dev/null +++ b/model/model/layers/11/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:8715b7f4a3d4e40a61bb31d506608eb17a7f79c59176d7940c6f0ebd81647b10 +size 411235 diff --git a/model/model/layers/11/self_attn/k_proj/kernel/2.0 b/model/model/layers/11/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..d7e759b1e577b9199b552653263184e63ef74de7 --- /dev/null +++ b/model/model/layers/11/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90c2bbd55888f220664e9a7e8d0a0c2e714a073181098e55b42caaa6f6d5829e +size 411212 diff --git a/model/model/layers/11/self_attn/k_proj/kernel/3.0 b/model/model/layers/11/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..7b8be59e2a8f7fb579c898f4698e31885a5c044d --- /dev/null +++ b/model/model/layers/11/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ff80beff3339e98907e4480dfd16452654536eccfde5af9d727841292e2be7d +size 411128 diff --git a/model/model/layers/11/self_attn/o_proj/kernel/.zarray b/model/model/layers/11/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..1f43215c04ea8738b5721bed11256b14599d4e36 --- /dev/null +++ b/model/model/layers/11/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/11/self_attn/o_proj/kernel/0.0 b/model/model/layers/11/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..bc796ce895dfeb89e7aef9334513e6f7d7c5c2bf --- /dev/null +++ b/model/model/layers/11/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6a0fc2cff6597ba6155317b797fa633798a2c9ee6f55949478872aab89b0289 +size 1635483 diff --git 
a/model/model/layers/11/self_attn/o_proj/kernel/0.1 b/model/model/layers/11/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..c923ac7c6e480781099db229f9e00b1ae587f077 --- /dev/null +++ b/model/model/layers/11/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e65d8aca1c12a27624e0e7e94966bf9d44432da11f951f322fd7dc883064c4f +size 1635473 diff --git a/model/model/layers/11/self_attn/o_proj/kernel/0.2 b/model/model/layers/11/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..48c435a22cc684becc7a3230ff12f6e091337895 --- /dev/null +++ b/model/model/layers/11/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ad1476ed7852e682ffb428b47fd840f98835d2c2ef08e8435683e55a4279b85 +size 1634988 diff --git a/model/model/layers/11/self_attn/o_proj/kernel/0.3 b/model/model/layers/11/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..22c195496dea8ca4d290414db157640dfe5953df --- /dev/null +++ b/model/model/layers/11/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dc3b32fc9eeebc87ad6868b9506f67e070a2f6d19656880c4b816388a4ceb41 +size 1634791 diff --git a/model/model/layers/11/self_attn/q_proj/kernel/.zarray b/model/model/layers/11/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..059f1aabbdc9e18d982e2db50174668264fc96e4 --- /dev/null +++ b/model/model/layers/11/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/11/self_attn/q_proj/kernel/0.0 b/model/model/layers/11/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..1c7a93f859bacba839977c49810d6abe991637c2 --- /dev/null +++ b/model/model/layers/11/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5482e353ebf4d8cddad174e9485c91738b333017c6a9648b04d01a6d37624b1 +size 1646343 diff --git a/model/model/layers/11/self_attn/q_proj/kernel/1.0 b/model/model/layers/11/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..2dc69bd45cc6bb4729e5bb83fa34b9b8a04683fe --- /dev/null +++ b/model/model/layers/11/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01b7de7ca200c464ca2fed57b43a8126f18eb2d5c276b453d1a54af83a16ced0 +size 1646719 diff --git a/model/model/layers/11/self_attn/q_proj/kernel/2.0 b/model/model/layers/11/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..1e992ebbf78365cc39748d73966ab2b09c4eb840 --- /dev/null +++ b/model/model/layers/11/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4ea3aafdf48aeffe4168acd8e15e54cc3410a305337302da369f8a49f80ddd7 +size 1646404 diff --git a/model/model/layers/11/self_attn/q_proj/kernel/3.0 b/model/model/layers/11/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..9c6ea9f5614e279ac55329384505d91e2aa422df --- /dev/null +++ b/model/model/layers/11/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edd038fe916bca86938556838515dece7d8a4a8169c4184f3ed3b904612b2d01 +size 1646412 diff --git a/model/model/layers/11/self_attn/v_proj/kernel/.zarray b/model/model/layers/11/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/11/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/11/self_attn/v_proj/kernel/0.0 b/model/model/layers/11/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..3219f850ae5635d13da0a18e70a650633d75e8db --- /dev/null +++ b/model/model/layers/11/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:934498e78839d7a146cbf8c6c21ae91313f0f5364c022705e4f7836adf1bb504 +size 409478 diff --git a/model/model/layers/11/self_attn/v_proj/kernel/1.0 b/model/model/layers/11/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..e07d76e9d1014622bcf3917d3c32f42e9c082d40 --- /dev/null +++ b/model/model/layers/11/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43a21c9a752da92629122fedd34b8829adefda5099c58d083135a80e0fa5318e +size 409640 diff --git a/model/model/layers/11/self_attn/v_proj/kernel/2.0 b/model/model/layers/11/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..6d5eb187f4545b482414f7b2c2793f6a2bc3122f --- /dev/null +++ b/model/model/layers/11/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bacf0af79dc1ddd6e4b22ffc532e2247641f514120f3ce831f026be6d2eab4c8 +size 409373 diff --git a/model/model/layers/11/self_attn/v_proj/kernel/3.0 b/model/model/layers/11/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..72e8d95addb08989383868f470b33cf62b3350c2 --- /dev/null +++ b/model/model/layers/11/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c19e0d00254e7439edf0496bc1493650a552168f09e673c09211ef928333e135 +size 409289 diff 
--git a/model/model/layers/12/input_layernorm/kernel/.zarray b/model/model/layers/12/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/12/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/12/input_layernorm/kernel/0 b/model/model/layers/12/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..0f3ed206bc6dff531d74a3ac0eb59d31c7c18b69 Binary files /dev/null and b/model/model/layers/12/input_layernorm/kernel/0 differ diff --git a/model/model/layers/12/mlp/down_proj/kernel/.zarray b/model/model/layers/12/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..b57b49d09e50779e6e0a2e2d784feed4998dadab --- /dev/null +++ b/model/model/layers/12/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/12/mlp/down_proj/kernel/0.0 b/model/model/layers/12/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..bacc49bd031aa01df8b5a84586fa48f910bb2ab3 --- /dev/null +++ b/model/model/layers/12/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e4ca8b58164240e1fcb925503d805c17465e4c83054c083a448d92f82d1e6f2 +size 6540753 diff --git a/model/model/layers/12/mlp/down_proj/kernel/0.1 b/model/model/layers/12/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..126350929b28e24d650eabfa8575aa7180526009 --- /dev/null +++ b/model/model/layers/12/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a05d577beb40413da11da516bb59e61278d357c9c58ede4fb52476c794f2fe25 +size 6540944 diff --git a/model/model/layers/12/mlp/down_proj/kernel/0.2 b/model/model/layers/12/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..79d7458d97ef41098f6f88128988793a9bb433c1 --- /dev/null +++ b/model/model/layers/12/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c03dd26c1b6564970fb7446d5bea46d39940b4970a842023a7b00f78d84f00 +size 6540107 diff --git a/model/model/layers/12/mlp/down_proj/kernel/0.3 b/model/model/layers/12/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..c0d0ad5fba328325e54148b58455f0c514501b41 --- /dev/null +++ b/model/model/layers/12/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71ee97ba6459d5866699b6ce26dbf67f45d43cfb2d12bf506cddb0743180466e +size 6539379 diff --git a/model/model/layers/12/mlp/gate_proj/kernel/.zarray b/model/model/layers/12/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/12/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/12/mlp/gate_proj/kernel/0.0 b/model/model/layers/12/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e6a3b44557cbd04acb25ce99dd1cb9bee926774f --- /dev/null +++ b/model/model/layers/12/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b6daa23fdf167146c24f55244e5d032556721fb7404bfbae92f237ae67b51af +size 6554270 diff --git a/model/model/layers/12/mlp/gate_proj/kernel/1.0 b/model/model/layers/12/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..0a98f5b5d61a19a555ca11350196db6fe25b054a --- /dev/null +++ b/model/model/layers/12/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2b75d3a743eb211838867a188665063185ffb49480a1bf0c932e9b29d1ae60d +size 6553577 diff --git a/model/model/layers/12/mlp/gate_proj/kernel/2.0 b/model/model/layers/12/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..dea7068381027c6478ec680bb777b706e6203ddc --- /dev/null +++ b/model/model/layers/12/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6dc986f1a439500cdfc57c1c45ff17e14c5308199727e41539d3c602a9ec388 +size 6553317 diff --git a/model/model/layers/12/mlp/gate_proj/kernel/3.0 b/model/model/layers/12/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..b9be19dc041365ce2cd1c2617e9c0170a55e4755 --- /dev/null +++ b/model/model/layers/12/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f569a59aa3f885a62b3dfd26252c1f7c8d9ee40365618051a3bcde9461abfd5 +size 6553286 diff --git a/model/model/layers/12/mlp/up_proj/kernel/.zarray b/model/model/layers/12/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/12/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/12/mlp/up_proj/kernel/0.0 b/model/model/layers/12/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c7ff02dff95ee83a780fc226733e89335a4347d5 --- /dev/null +++ b/model/model/layers/12/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d904a9ae5c0b6109cb70724a533001450ec6e2366a198c7e6760896cd9b1ad90 +size 6533572 diff --git a/model/model/layers/12/mlp/up_proj/kernel/1.0 b/model/model/layers/12/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..ee08bc6b9cc5685d7d09bb783670b25e273b1250 --- /dev/null +++ b/model/model/layers/12/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45eab20286fcedd97330e9455be9cd997fd9d6dde80deabc63a8295cbdedcbac +size 6534403 diff --git a/model/model/layers/12/mlp/up_proj/kernel/2.0 b/model/model/layers/12/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..e9132e9733e1149fd0a972a836cfb3161409289e --- /dev/null +++ b/model/model/layers/12/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f459e1447f291fc698974d929dab4e630adad35ab03b37e0d24d052c44ffb0a2 +size 6533250 diff --git a/model/model/layers/12/mlp/up_proj/kernel/3.0 b/model/model/layers/12/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..f5024aa51e4417ee12d0d891faf9f2d59a659b61 --- /dev/null +++ b/model/model/layers/12/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:832317b35a2f06b8dd588d1dfa4d75dc760a29fb891ae0790e3fa14dd4c73ee7 +size 6532894 diff --git a/model/model/layers/12/post_attention_layernorm/kernel/.zarray b/model/model/layers/12/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ 
b/model/model/layers/12/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/12/post_attention_layernorm/kernel/0 b/model/model/layers/12/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..22d7c45423bc6d3f4f2500a357ab71318916ef9f Binary files /dev/null and b/model/model/layers/12/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/12/self_attn/k_proj/kernel/.zarray b/model/model/layers/12/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/12/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/12/self_attn/k_proj/kernel/0.0 b/model/model/layers/12/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ea5cdb2646ea8c87fa9e175cf40a6273d59797a2 --- /dev/null +++ b/model/model/layers/12/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dba6e691c26b32daee15960b2e70c7e4f6d759f043935078e8aa4ab90908711 +size 412352 diff --git a/model/model/layers/12/self_attn/k_proj/kernel/1.0 b/model/model/layers/12/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..7bdc92f3dcdeab2e732eebbf8ec0b02af58f479f --- /dev/null +++ b/model/model/layers/12/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:fd38b28add6e6f46fd59f2a0c551d2246d396677eae8aaeae5e76f155a31f341 +size 412245 diff --git a/model/model/layers/12/self_attn/k_proj/kernel/2.0 b/model/model/layers/12/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..8260b8a149d9e7ce44546ea01d9507bcdd91b79f --- /dev/null +++ b/model/model/layers/12/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33ad099df30d0c9b2888d7e866a8a454e83658406cdb136a196658b7b3a01b2e +size 412349 diff --git a/model/model/layers/12/self_attn/k_proj/kernel/3.0 b/model/model/layers/12/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..37f47d23527cadc6b266950bcef7b1875e017067 --- /dev/null +++ b/model/model/layers/12/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be9365917c1039466efd5ff4872d2a76a2fbba4f2ec1c3ca623d9e3fa80d7efd +size 412174 diff --git a/model/model/layers/12/self_attn/o_proj/kernel/.zarray b/model/model/layers/12/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..1f43215c04ea8738b5721bed11256b14599d4e36 --- /dev/null +++ b/model/model/layers/12/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/12/self_attn/o_proj/kernel/0.0 b/model/model/layers/12/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f65675a4f18646f8570f1e9c9472c7e90f5c2523 --- /dev/null +++ b/model/model/layers/12/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39480a0c257472b12aec1ba9471369a3c593ef51f3848f12214a508e37653af8 +size 1636146 diff --git 
a/model/model/layers/12/self_attn/o_proj/kernel/0.1 b/model/model/layers/12/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..67d4e4aa9a1cec416b2659dc4e9c5d8f1cdc020b --- /dev/null +++ b/model/model/layers/12/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6516080878120bc5c9af6ba784cabc599b11fb0bf55f9a3af7bffe865e2a7a58 +size 1636179 diff --git a/model/model/layers/12/self_attn/o_proj/kernel/0.2 b/model/model/layers/12/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..bb5fdfa81a1333fc3574d2706c370ccf417f71d1 --- /dev/null +++ b/model/model/layers/12/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7166fc34f1438ff424c245a3c6617795bc8d4412c8e245a161650683b3fe263b +size 1635908 diff --git a/model/model/layers/12/self_attn/o_proj/kernel/0.3 b/model/model/layers/12/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..e2dd2dc2781a1b672f52da483fb9e12b700aaed6 --- /dev/null +++ b/model/model/layers/12/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dfb08e6bd7e1765fcbdf037ca755579ee5d0d3f247e87cbebdc9734433440db +size 1635685 diff --git a/model/model/layers/12/self_attn/q_proj/kernel/.zarray b/model/model/layers/12/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..059f1aabbdc9e18d982e2db50174668264fc96e4 --- /dev/null +++ b/model/model/layers/12/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/12/self_attn/q_proj/kernel/0.0 b/model/model/layers/12/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..a1e543632056b0ee30b6baf11c736ae81ee59cc7 --- /dev/null +++ b/model/model/layers/12/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baccb923215d0f91f7bb60071d5aac35b391b600c5c003d0b80923fe9357c60b +size 1651697 diff --git a/model/model/layers/12/self_attn/q_proj/kernel/1.0 b/model/model/layers/12/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..b61c074698835637d6d907411dcbfcc13ceebe43 --- /dev/null +++ b/model/model/layers/12/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19cc1d2c430cb4cbd83d3e14188e734ecf0ad23448888a25c2e2d5c1c658db0c +size 1651820 diff --git a/model/model/layers/12/self_attn/q_proj/kernel/2.0 b/model/model/layers/12/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..02a2ff8926374289f73a9c0752e32f6f75b8b719 --- /dev/null +++ b/model/model/layers/12/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cc6ac6ab836abf72c265fea8658badf1c14f2ec67ac837d44fc7031b8be892b +size 1651667 diff --git a/model/model/layers/12/self_attn/q_proj/kernel/3.0 b/model/model/layers/12/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..122a6740cce5049a3773d1a82f47562b70203f82 --- /dev/null +++ b/model/model/layers/12/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b84ef950f9c86c8df8ebb9842287917370744c1a2d9812e523a3e2f8349fb5a1 +size 1651879 diff --git a/model/model/layers/12/self_attn/v_proj/kernel/.zarray b/model/model/layers/12/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/12/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/12/self_attn/v_proj/kernel/0.0 b/model/model/layers/12/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a23a856a7f15be4b11fa1007f24f048419c6b96e --- /dev/null +++ b/model/model/layers/12/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62abc2d632bbac32e03946b55a7ae0e919151ac2feca365cebc7402b14137fdb +size 410521 diff --git a/model/model/layers/12/self_attn/v_proj/kernel/1.0 b/model/model/layers/12/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..f1c83a714e829a0ed33a847ddd1664d015cc9f35 --- /dev/null +++ b/model/model/layers/12/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edb341ded3ef61a1e1aec6eacf9c94cc080429d10578c3415abe52f6d9eec56f +size 410697 diff --git a/model/model/layers/12/self_attn/v_proj/kernel/2.0 b/model/model/layers/12/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..e08470d4ea81fca4c2ad369f401f0232c9cad4dc --- /dev/null +++ b/model/model/layers/12/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a14793b5452847ddfa5f4346713fdfb563f831de92ad7abdb8dd80379a432f24 +size 410479 diff --git a/model/model/layers/12/self_attn/v_proj/kernel/3.0 b/model/model/layers/12/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..c117440978ce9d594bbeb7876ec39a7ecbe7806f --- /dev/null +++ b/model/model/layers/12/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c772748b771c64ba3e7addd35ccffdc1d9f8c2604c5360e69692cd2fc371abd +size 410448 diff 
--git a/model/model/layers/13/input_layernorm/kernel/.zarray b/model/model/layers/13/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/13/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/13/input_layernorm/kernel/0 b/model/model/layers/13/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..87fec3467d41ba4647fb830310fc551544305341 Binary files /dev/null and b/model/model/layers/13/input_layernorm/kernel/0 differ diff --git a/model/model/layers/13/mlp/down_proj/kernel/.zarray b/model/model/layers/13/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..b57b49d09e50779e6e0a2e2d784feed4998dadab --- /dev/null +++ b/model/model/layers/13/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/13/mlp/down_proj/kernel/0.0 b/model/model/layers/13/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..6f6b2b9981bb8a1d9d4911d786c455c0c07f0a17 --- /dev/null +++ b/model/model/layers/13/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:694cde02a78245e5c9c8cfb26b31b721b19e57e641ab6106ea0973e154a1a243 +size 6543435 diff --git a/model/model/layers/13/mlp/down_proj/kernel/0.1 b/model/model/layers/13/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..9c4412c3c6b5834ce1bc10967db1a3e51e36d068 --- /dev/null +++ b/model/model/layers/13/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e96fe277e536bff32a3aba94658fc3decbb7ddbdb6adb4de9be8d93fdc53e278 +size 6543868 diff --git a/model/model/layers/13/mlp/down_proj/kernel/0.2 b/model/model/layers/13/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..9b3f9eab9ce2692acd0408dd74067b52835a59bd --- /dev/null +++ b/model/model/layers/13/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc669c9696f813390c0e0ee64affb9136eaf0713c1daba5fd134b07c99af0514 +size 6542850 diff --git a/model/model/layers/13/mlp/down_proj/kernel/0.3 b/model/model/layers/13/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..2ce9aa0f4b9072545ede23cf348ce9c69e74ce1b --- /dev/null +++ b/model/model/layers/13/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8a8b6c43833fe76926c2bb06bc16d99ca41209017b79baeafd0586824e3edb4 +size 6541761 diff --git a/model/model/layers/13/mlp/gate_proj/kernel/.zarray b/model/model/layers/13/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/13/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/13/mlp/gate_proj/kernel/0.0 b/model/model/layers/13/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..31bd57554fd5f29e571c5c5871bf5b30a0efb3e1 --- /dev/null +++ b/model/model/layers/13/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:823cc93f331ac1d086a620b18191de57e8d0d50bd25917f11fe8f4bc2836aa3c +size 6551087 diff --git a/model/model/layers/13/mlp/gate_proj/kernel/1.0 b/model/model/layers/13/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..47e49a36dfdfa7ee55bf3254aebfe7b7afca0e53 --- /dev/null +++ b/model/model/layers/13/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a74466ec4d58507a7480d4abd55413f2f802efa8056ff0d4ef22c69624c5c76a +size 6550787 diff --git a/model/model/layers/13/mlp/gate_proj/kernel/2.0 b/model/model/layers/13/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..14503908bdc5d7a7ccce52dd145e5048d28a7803 --- /dev/null +++ b/model/model/layers/13/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c56850b56db74bc52bff9039e39c88396ed587d1c7f175a4173e1f367e68f3bd +size 6550536 diff --git a/model/model/layers/13/mlp/gate_proj/kernel/3.0 b/model/model/layers/13/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..3e78d9471b71f87b1c5f35d7859e352668cdea99 --- /dev/null +++ b/model/model/layers/13/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f2ed62609e218a838b6f95fddce77fa9db3ca8490befd0386b1320658a48a46 +size 6550679 diff --git a/model/model/layers/13/mlp/up_proj/kernel/.zarray b/model/model/layers/13/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/13/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/13/mlp/up_proj/kernel/0.0 b/model/model/layers/13/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ff26bb7f07a2739251e935e97467f282426cdd99 --- /dev/null +++ b/model/model/layers/13/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:986918f4be91021ca3f555bf0d4e7eed514c53b37c08a25173782448bab80dcd +size 6535638 diff --git a/model/model/layers/13/mlp/up_proj/kernel/1.0 b/model/model/layers/13/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..be0ccd7c8f69cc07732c3eeaaa79f44dc7f2eb4b --- /dev/null +++ b/model/model/layers/13/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f19e7a166fde818e7f4c2ff04b70cdd273eb731c51c359ae91bed251172481c7 +size 6534656 diff --git a/model/model/layers/13/mlp/up_proj/kernel/2.0 b/model/model/layers/13/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..877fcbb366d307bbc723f8d1f6f5ce443c42987d --- /dev/null +++ b/model/model/layers/13/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e58b814f180183ba9ab9acacf03d9faa4b520a5ea3e638553904de37d00d91b +size 6534844 diff --git a/model/model/layers/13/mlp/up_proj/kernel/3.0 b/model/model/layers/13/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..0278d926eb0c148174987f5093659f940123f054 --- /dev/null +++ b/model/model/layers/13/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44172eac947d9b5820a5a12acd0faa7d106c1aeba81fadd13a74073cbfca3935 +size 6534078 diff --git a/model/model/layers/13/post_attention_layernorm/kernel/.zarray b/model/model/layers/13/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ 
b/model/model/layers/13/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/13/post_attention_layernorm/kernel/0 b/model/model/layers/13/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..4c586de89629fa1722a155528009ff7ef19662f6 Binary files /dev/null and b/model/model/layers/13/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/13/self_attn/k_proj/kernel/.zarray b/model/model/layers/13/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/13/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/13/self_attn/k_proj/kernel/0.0 b/model/model/layers/13/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..012fa5e1ca69f440c6155499ff10ed0660d1b052 --- /dev/null +++ b/model/model/layers/13/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a552da3ec51645be4131466455461550994a3b9d39e513bf2cf556e3d666c5b +size 411393 diff --git a/model/model/layers/13/self_attn/k_proj/kernel/1.0 b/model/model/layers/13/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..ef08e4a28ea7e73f9f08c36a6673a1e2fef694f9 --- /dev/null +++ b/model/model/layers/13/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:daeb1cee00f45392273fced9626fb0f84eafcf0b4dc63ed6b05727182c667945 +size 411594 diff --git a/model/model/layers/13/self_attn/k_proj/kernel/2.0 b/model/model/layers/13/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..99c1361a83eb3235b39d4200dce3d48f38889f3d --- /dev/null +++ b/model/model/layers/13/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea619e8767237f311da365b5565ba0625be8d37cb70f22a53af9f2f429bc057c +size 411414 diff --git a/model/model/layers/13/self_attn/k_proj/kernel/3.0 b/model/model/layers/13/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..48c2789edad445ac13fd222cd0a7d9fcaacaaf07 --- /dev/null +++ b/model/model/layers/13/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0435f94a71e69518d7ae386e752c3249761c6c5b17b17facbf8c56bb6fa750c8 +size 411317 diff --git a/model/model/layers/13/self_attn/o_proj/kernel/.zarray b/model/model/layers/13/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..1f43215c04ea8738b5721bed11256b14599d4e36 --- /dev/null +++ b/model/model/layers/13/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/13/self_attn/o_proj/kernel/0.0 b/model/model/layers/13/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f38a0100314bdb1d878ae58181eb00dbf27eb9ae --- /dev/null +++ b/model/model/layers/13/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f48ce0d43a10c012b29c4eee9ee33c97ac05169aefa121d6341a7a80ed850d58 +size 1634473 diff --git 
a/model/model/layers/13/self_attn/o_proj/kernel/0.1 b/model/model/layers/13/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..49dbf96f1ca424e21897773a5e54a68751ae87e4 --- /dev/null +++ b/model/model/layers/13/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:617526fc797d114015700bc48029112c00dfb70ac9789ab3722a5512390732a2 +size 1634894 diff --git a/model/model/layers/13/self_attn/o_proj/kernel/0.2 b/model/model/layers/13/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..ed6ded4516980e28e028d389ce7107d715d423a7 --- /dev/null +++ b/model/model/layers/13/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cb01eca102e889000dae730bbb45d45726e6aa6044a22ddbd9a64a50ae5ba44 +size 1634595 diff --git a/model/model/layers/13/self_attn/o_proj/kernel/0.3 b/model/model/layers/13/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..8588d13527e4ec28090f88098542ce883424a9b4 --- /dev/null +++ b/model/model/layers/13/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:885fc77b34c720d606887c7e20e740eebc32ea6874b321636cfd72f66592cdb5 +size 1634777 diff --git a/model/model/layers/13/self_attn/q_proj/kernel/.zarray b/model/model/layers/13/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..059f1aabbdc9e18d982e2db50174668264fc96e4 --- /dev/null +++ b/model/model/layers/13/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/13/self_attn/q_proj/kernel/0.0 b/model/model/layers/13/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..985a76e34c9de8ba6bf27b414ed08d999ca19bf6 --- /dev/null +++ b/model/model/layers/13/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5bc85c7ef7ce63fee3ee4074718024b65fdd43eb698df189b41afdfcdc1fdd2 +size 1650423 diff --git a/model/model/layers/13/self_attn/q_proj/kernel/1.0 b/model/model/layers/13/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..a7591e7d15e098dcb4d52736d8112aa5511f34a7 --- /dev/null +++ b/model/model/layers/13/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e4a67c9ab8f1e08d154fef92786b589818f8c0a256f6df6860edd2781e7a75b +size 1650914 diff --git a/model/model/layers/13/self_attn/q_proj/kernel/2.0 b/model/model/layers/13/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..92d6cd962e61de9c5178ac89a38fbaa1cd3cf85b --- /dev/null +++ b/model/model/layers/13/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c28c966c3088b86a097c0d1a5f1bed06665f5e0840c9e7decf1386113761910c +size 1650351 diff --git a/model/model/layers/13/self_attn/q_proj/kernel/3.0 b/model/model/layers/13/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..11a0f9113fa4d3415841dcc4adf023c2f01b133f --- /dev/null +++ b/model/model/layers/13/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:906bb62c70ec1609ebc0538f32a94749d97a7deb511bfbd0549688fef26272ac +size 1650301 diff --git a/model/model/layers/13/self_attn/v_proj/kernel/.zarray b/model/model/layers/13/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/13/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/13/self_attn/v_proj/kernel/0.0 b/model/model/layers/13/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..1da6f2aea8f01bf109d38ef64b9f7300937ad6c0 --- /dev/null +++ b/model/model/layers/13/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad198a7966ec539b1a56ca153734ee66998c23f4dee97331afcc47ed1d87f313 +size 410738 diff --git a/model/model/layers/13/self_attn/v_proj/kernel/1.0 b/model/model/layers/13/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..0df2facb54a069e1740c9697b1a37cea840a1edd --- /dev/null +++ b/model/model/layers/13/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d92e5cdde62c57d76b0d9560e974f4de97ead4265c1e86c83470beb94cad656 +size 410759 diff --git a/model/model/layers/13/self_attn/v_proj/kernel/2.0 b/model/model/layers/13/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..cf2df1802e9b5e7331b2475d4a008c26c1fa0c3e --- /dev/null +++ b/model/model/layers/13/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0456a383b8fdf217ff3605ac7ae07f4a2c58e74b1fa4ae358d992fd735d93954 +size 410738 diff --git a/model/model/layers/13/self_attn/v_proj/kernel/3.0 b/model/model/layers/13/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..ffe10ff5d31c41ddaf6cef4f285d359e55cdde1b --- /dev/null +++ b/model/model/layers/13/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ecbcdb7f68359aea30f317f498bc174c90ea7b7ea41c39fc96d6a1114bb6d71 +size 410648 diff 
--git a/model/model/layers/14/input_layernorm/kernel/.zarray b/model/model/layers/14/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/14/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/14/input_layernorm/kernel/0 b/model/model/layers/14/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..34271732d416b234a77ca2b65660b8e8c74f84b8 Binary files /dev/null and b/model/model/layers/14/input_layernorm/kernel/0 differ diff --git a/model/model/layers/14/mlp/down_proj/kernel/.zarray b/model/model/layers/14/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..b57b49d09e50779e6e0a2e2d784feed4998dadab --- /dev/null +++ b/model/model/layers/14/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/14/mlp/down_proj/kernel/0.0 b/model/model/layers/14/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..94587974d53b5f123a35043ca15a6af4277f0f63 --- /dev/null +++ b/model/model/layers/14/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:346394a0663eda00187596279f1acb360503fe0ee3c814e810da10e95a1bee7c +size 6544536 diff --git a/model/model/layers/14/mlp/down_proj/kernel/0.1 b/model/model/layers/14/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..6d992f0ce457af3ce73c2b1e875f02afe285c127 --- /dev/null +++ b/model/model/layers/14/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9fe4a11b8bb148e73049b1cc45c61d2b491fee195e9bab8aab96c6b7d325df0 +size 6544446 diff --git a/model/model/layers/14/mlp/down_proj/kernel/0.2 b/model/model/layers/14/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..6dab85256a2bcd38385083c6b50cb6f6dc196a2f --- /dev/null +++ b/model/model/layers/14/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2834236a95c1a785130f258c42db38fb7b48478b9d9ee3765a0c7d5670f58d8 +size 6544637 diff --git a/model/model/layers/14/mlp/down_proj/kernel/0.3 b/model/model/layers/14/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..0129ba3afa9b7f3e0b6290cd77936fe056616c38 --- /dev/null +++ b/model/model/layers/14/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb3f28296934b37fb5980321d951ed6b6a0c5909452449a6c8f4d89fe5e2949c +size 6543741 diff --git a/model/model/layers/14/mlp/gate_proj/kernel/.zarray b/model/model/layers/14/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/14/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/14/mlp/gate_proj/kernel/0.0 b/model/model/layers/14/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e09e02f74a6da84423a96eab7ea8dfb8638cdc9d --- /dev/null +++ b/model/model/layers/14/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd99ae1c3a526b488b4c4a2a5c934e56f6a9eb8f72c495463133540737da84b8 +size 6557182 diff --git a/model/model/layers/14/mlp/gate_proj/kernel/1.0 b/model/model/layers/14/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..87225f86255f93916f5af0be754b5cb790c9cf7f --- /dev/null +++ b/model/model/layers/14/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:803edb5b1efd412f3dd5094e33bba2708c694b4b79b80ddc227a94fc9a3cc028 +size 6556298 diff --git a/model/model/layers/14/mlp/gate_proj/kernel/2.0 b/model/model/layers/14/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..3f46dbf962a8bde62208a441b675cd4a65c983b5 --- /dev/null +++ b/model/model/layers/14/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3af6350c12759618e29ccdd089d7f212fe3e65dc99885daafcc51e1a795cbda +size 6556643 diff --git a/model/model/layers/14/mlp/gate_proj/kernel/3.0 b/model/model/layers/14/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..a9c7aa2f63acf9e1e4cd84b15b49f92178c4fcef --- /dev/null +++ b/model/model/layers/14/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5faf380e9270d395724613d1623311eee7bcfac7062a704857abaa9a3de5cca +size 6556549 diff --git a/model/model/layers/14/mlp/up_proj/kernel/.zarray b/model/model/layers/14/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/14/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/14/mlp/up_proj/kernel/0.0 b/model/model/layers/14/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..55c3c8372bfa54f29880107e3c4067c0d9c6971a --- /dev/null +++ b/model/model/layers/14/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7fe30adbdaf496eb83c1837f1538a5a47e49a6e0a1613f2933491213e210c25 +size 6535788 diff --git a/model/model/layers/14/mlp/up_proj/kernel/1.0 b/model/model/layers/14/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..f4c0dfa24be4d40fcfc1b381b7ade1f7d5087de4 --- /dev/null +++ b/model/model/layers/14/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a21dc29bb93af4866a4ed2fa64010a572a593b918c825005e817f0299c9e31c +size 6535765 diff --git a/model/model/layers/14/mlp/up_proj/kernel/2.0 b/model/model/layers/14/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..06838e25f3bd9f330a447a656756866ff8498ba6 --- /dev/null +++ b/model/model/layers/14/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50aac7a386752eee07072c2a1c12b725d41cd63d6d1957783040b9e05f79083a +size 6536262 diff --git a/model/model/layers/14/mlp/up_proj/kernel/3.0 b/model/model/layers/14/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..86eee37add4a60d26143c5cbc0591bbdc69e2bcc --- /dev/null +++ b/model/model/layers/14/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27e6e4ff5ec3346b3113425c912bf017c0e5d3c0d6974c4595cb87264a5b8160 +size 6536257 diff --git a/model/model/layers/14/post_attention_layernorm/kernel/.zarray b/model/model/layers/14/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ 
b/model/model/layers/14/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/14/post_attention_layernorm/kernel/0 b/model/model/layers/14/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..eec6fa23a167f82cc96a085643944aca058d0b71 Binary files /dev/null and b/model/model/layers/14/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/14/self_attn/k_proj/kernel/.zarray b/model/model/layers/14/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/14/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/14/self_attn/k_proj/kernel/0.0 b/model/model/layers/14/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..0e37f49512950793a1a86ff513377c7468027f8c --- /dev/null +++ b/model/model/layers/14/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b24c786f75f4df460966751a5bbbbe7024e507601b40371cfa9541f7f9521e53 +size 412682 diff --git a/model/model/layers/14/self_attn/k_proj/kernel/1.0 b/model/model/layers/14/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..b1353f658021ae7aae2ca60a43272655d85426c9 --- /dev/null +++ b/model/model/layers/14/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:d14af2812466e051e4af14a45d5dc2b2892c68af04f04585c3bef5b22c67d940 +size 412629 diff --git a/model/model/layers/14/self_attn/k_proj/kernel/2.0 b/model/model/layers/14/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..6c3989d8cf9c6d4c594c2ef9c52a6304d037fa93 --- /dev/null +++ b/model/model/layers/14/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e16b2fa79f110b4914bb3f5ed989f4f8c258b17b9f80953efc52eb3998f4234f +size 412566 diff --git a/model/model/layers/14/self_attn/k_proj/kernel/3.0 b/model/model/layers/14/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..df2954e4bd75bd1d4731b1eed756238a5c4017c7 --- /dev/null +++ b/model/model/layers/14/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19f6b8112293d33beb8142dcb981659d16152d6e397ed1c61cfddc5eb70ccf1c +size 412444 diff --git a/model/model/layers/14/self_attn/o_proj/kernel/.zarray b/model/model/layers/14/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..1f43215c04ea8738b5721bed11256b14599d4e36 --- /dev/null +++ b/model/model/layers/14/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/14/self_attn/o_proj/kernel/0.0 b/model/model/layers/14/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..b7c4dc8ae4fb232881c40c8b245769aa6a145d60 --- /dev/null +++ b/model/model/layers/14/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b754a47db0c51991428457d4767261b0d26195e739533b1d6306a507d6e6920f +size 1636649 diff --git 
a/model/model/layers/14/self_attn/o_proj/kernel/0.1 b/model/model/layers/14/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..9c5b6f31b087bf9208f23422ca861ac7e8db437f --- /dev/null +++ b/model/model/layers/14/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7f491a8dbf927946d438da91269e5a75337a5e6d8fdbb903efbac234a1023fd +size 1636822 diff --git a/model/model/layers/14/self_attn/o_proj/kernel/0.2 b/model/model/layers/14/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..1b110abf3675ac0534af32fb19739eae1f355056 --- /dev/null +++ b/model/model/layers/14/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c47faa237815d768e21bd19641fdeb16627d8113bdf8597ff27433849bc93635 +size 1636575 diff --git a/model/model/layers/14/self_attn/o_proj/kernel/0.3 b/model/model/layers/14/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..2d51d3572f839f5cbfedc5e657398d7484ff61bb --- /dev/null +++ b/model/model/layers/14/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea87b07c770d980b8e4846767c6d607f8beb829d2b3772dfe109cb75270ca6c3 +size 1636962 diff --git a/model/model/layers/14/self_attn/q_proj/kernel/.zarray b/model/model/layers/14/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..059f1aabbdc9e18d982e2db50174668264fc96e4 --- /dev/null +++ b/model/model/layers/14/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/14/self_attn/q_proj/kernel/0.0 b/model/model/layers/14/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..16134e8427beea6cbd922158ea03919df87999ed --- /dev/null +++ b/model/model/layers/14/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abe13c16297354742749e978aa119a4665a4ca6c9432f72ea973994611d4face +size 1654082 diff --git a/model/model/layers/14/self_attn/q_proj/kernel/1.0 b/model/model/layers/14/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..02f0821c3d50d6a75c213ee09f9c506f7c4fd3e6 --- /dev/null +++ b/model/model/layers/14/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4e52c11ee8cddf38d8e72b09bf88aaf5d0b9ca86e6082331fc5820ef3c0098f +size 1654087 diff --git a/model/model/layers/14/self_attn/q_proj/kernel/2.0 b/model/model/layers/14/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..96007f13d7159fba83bc3de253238ead69c44784 --- /dev/null +++ b/model/model/layers/14/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1a631861e5f292889da4edb2c0bdd6428be9b29906a4e299d1e91506c1f0503 +size 1654271 diff --git a/model/model/layers/14/self_attn/q_proj/kernel/3.0 b/model/model/layers/14/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..9da58824311bc9ace727a1613aa4fc053b9379f8 --- /dev/null +++ b/model/model/layers/14/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:738fc61a52f3b5b907766ccb0cbe4bee1bf1c3e26df7cc3b1eabee78a800d3f5 +size 1653774 diff --git a/model/model/layers/14/self_attn/v_proj/kernel/.zarray b/model/model/layers/14/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/14/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/14/self_attn/v_proj/kernel/0.0 b/model/model/layers/14/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..3738c8fbe9bd0237f8c36ac5d0d3bec76de4e910 --- /dev/null +++ b/model/model/layers/14/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01ed4f69bb50103fd43e9f3d75311234039df366fe21c0ff589ca6666aca99c2 +size 411121 diff --git a/model/model/layers/14/self_attn/v_proj/kernel/1.0 b/model/model/layers/14/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..b773119dfdb70775aea5cebfcc20b1fd404db76b --- /dev/null +++ b/model/model/layers/14/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11b36ab2821b9fbc0c5ce391816e08f436cfb4385e80443a6f89cd9079dca2b1 +size 411161 diff --git a/model/model/layers/14/self_attn/v_proj/kernel/2.0 b/model/model/layers/14/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..3dac1a8b36afd923cab2d05efbb75474a5306850 --- /dev/null +++ b/model/model/layers/14/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d9cece28b4460aa3a6d5de0f403c521ba5174c684dab8feee6816df5ba6fbf8 +size 410657 diff --git a/model/model/layers/14/self_attn/v_proj/kernel/3.0 b/model/model/layers/14/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..5079a62fb88cba085a0be4976ccb723d2743217c --- /dev/null +++ b/model/model/layers/14/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89e185ebbfbca13871e83dbb4f1934f7da53c3a7f60215c637a37da36a3a93b5 +size 410791 diff 
--git a/model/model/layers/15/input_layernorm/kernel/.zarray b/model/model/layers/15/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/15/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/15/input_layernorm/kernel/0 b/model/model/layers/15/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..32d87f7ecd34657860a22a0c9e2f46a37faa0507 Binary files /dev/null and b/model/model/layers/15/input_layernorm/kernel/0 differ diff --git a/model/model/layers/15/mlp/down_proj/kernel/.zarray b/model/model/layers/15/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..b57b49d09e50779e6e0a2e2d784feed4998dadab --- /dev/null +++ b/model/model/layers/15/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/15/mlp/down_proj/kernel/0.0 b/model/model/layers/15/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..6eecb99b72e4e3f0b80b67c56af5b6a064e55171 --- /dev/null +++ b/model/model/layers/15/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f35284e03f75c65edb0980b86772d47aa84a02a19eccb10755984a5b4ba17b2 +size 6547212 diff --git a/model/model/layers/15/mlp/down_proj/kernel/0.1 b/model/model/layers/15/mlp/down_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..f8bbfd71a601dcabc43a35131e40c7a4f5ea4af1 --- /dev/null +++ b/model/model/layers/15/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8740b37afe7b19fc0f6a6391e1b82e3a7307a499b297b2d507823bb463ca1de +size 6548401 diff --git a/model/model/layers/15/mlp/down_proj/kernel/0.2 b/model/model/layers/15/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..ac4803158f029491c72fb90f7df078c3de74df39 --- /dev/null +++ b/model/model/layers/15/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd57d79aa1f0c67db4d62d037b982da133233a31fd4780e385c7a7bacac0b322 +size 6548670 diff --git a/model/model/layers/15/mlp/down_proj/kernel/0.3 b/model/model/layers/15/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..c4e8c14af4eb687960c45c8b30a5a9573b2e975f --- /dev/null +++ b/model/model/layers/15/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54e06b72879b862160b18bb4b475c3d00881a9cd63ea4345a28badb8f10a3b2f +size 6547582 diff --git a/model/model/layers/15/mlp/gate_proj/kernel/.zarray b/model/model/layers/15/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/15/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/15/mlp/gate_proj/kernel/0.0 b/model/model/layers/15/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..3ff34653058a648e0fbcfd9ab9f68a859fead8db --- /dev/null +++ b/model/model/layers/15/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c37aec808026d50fbddaed63a204e036d484b7d817a64c6c9993fea861c8032f +size 6564184 diff --git a/model/model/layers/15/mlp/gate_proj/kernel/1.0 b/model/model/layers/15/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..a88352d578337d70511d988c1cbe898a76a95435 --- /dev/null +++ b/model/model/layers/15/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05a5057acbaed13f99b164d5fa13a307ef9552e68979d2dff1f3e5d6c56e1845 +size 6565183 diff --git a/model/model/layers/15/mlp/gate_proj/kernel/2.0 b/model/model/layers/15/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..3fd5c9f88953157e65b7696d6b25618be4ebdb32 --- /dev/null +++ b/model/model/layers/15/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10465298775c4c8b3aacb24a108497ed9f1f88e8fce3f48184ebedfd61a203dd +size 6564872 diff --git a/model/model/layers/15/mlp/gate_proj/kernel/3.0 b/model/model/layers/15/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..ec3250a0cd9a57ca5c38eb3ddce5c639923a2f4f --- /dev/null +++ b/model/model/layers/15/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ec72a9b858c84474b90ab9667ccf300d726d750c513ac36524dcdf98cf462cd +size 6565213 diff --git a/model/model/layers/15/mlp/up_proj/kernel/.zarray b/model/model/layers/15/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/15/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git 
a/model/model/layers/15/mlp/up_proj/kernel/0.0 b/model/model/layers/15/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..2f3e3aa2386394ef221b46f188cd935b27700b64 --- /dev/null +++ b/model/model/layers/15/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c671ab5049c86c5a68c4230d0ebec3bed8639003da2e699a9c52aed1191867a7 +size 6542654 diff --git a/model/model/layers/15/mlp/up_proj/kernel/1.0 b/model/model/layers/15/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..5b957332d9f543236dd2fbaeb9d154c5dfaa7e4b --- /dev/null +++ b/model/model/layers/15/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f97f48bf4e4e68b1490d7dd7221acd199631d16a2a4160e148585a9ca7eb009 +size 6543177 diff --git a/model/model/layers/15/mlp/up_proj/kernel/2.0 b/model/model/layers/15/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..991f40b558e59848d43174ab02acb27b4d48e55d --- /dev/null +++ b/model/model/layers/15/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59a260ae285d688260592e8c6a7cd1053913ae0b388960dce43680b0db01f95a +size 6542429 diff --git a/model/model/layers/15/mlp/up_proj/kernel/3.0 b/model/model/layers/15/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..68da3aa2f77c7eab56f335ebee95029470ade988 --- /dev/null +++ b/model/model/layers/15/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06a1301ae5da13d60d107c00e14d9fe00d92c8176e7dc9d3c3e589ce173770b9 +size 6543130 diff --git a/model/model/layers/15/post_attention_layernorm/kernel/.zarray b/model/model/layers/15/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ 
b/model/model/layers/15/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/15/post_attention_layernorm/kernel/0 b/model/model/layers/15/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..40836420388b770e09f016bf328c8a9a4d629abc Binary files /dev/null and b/model/model/layers/15/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/15/self_attn/k_proj/kernel/.zarray b/model/model/layers/15/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/15/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/15/self_attn/k_proj/kernel/0.0 b/model/model/layers/15/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8ad4cc4565dfb4c768d79507928b4639355aa3a7 --- /dev/null +++ b/model/model/layers/15/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d5ff0de6f1c7e44b297e8e470cbf956e102de3c46052405800c46351a0de79f +size 412205 diff --git a/model/model/layers/15/self_attn/k_proj/kernel/1.0 b/model/model/layers/15/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..3a07687cb38e7984f78106edae79e6d86167da71 --- /dev/null +++ b/model/model/layers/15/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:ce685dda2c7779d0bf8d505ca813b8b0839676a1079ddcdf27b7a8289101d6b3 +size 412182 diff --git a/model/model/layers/15/self_attn/k_proj/kernel/2.0 b/model/model/layers/15/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..85a07b8e2b27f3352deb30e10be9484be872aedf --- /dev/null +++ b/model/model/layers/15/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e7a224d92e505f63e4cc6a7ed8bad4646a08e517bfb1dda7db6ab59bce91d72 +size 412144 diff --git a/model/model/layers/15/self_attn/k_proj/kernel/3.0 b/model/model/layers/15/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..c3fc3dc426ca58eacad78e048d336a19209c6341 --- /dev/null +++ b/model/model/layers/15/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa0fef13f3286153621cb941646a3c13b9a173bfc4e755fb0aeb4e74cefba398 +size 412151 diff --git a/model/model/layers/15/self_attn/o_proj/kernel/.zarray b/model/model/layers/15/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..1f43215c04ea8738b5721bed11256b14599d4e36 --- /dev/null +++ b/model/model/layers/15/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/15/self_attn/o_proj/kernel/0.0 b/model/model/layers/15/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8f514b18daa737f1ab88d8e721992292099fa345 --- /dev/null +++ b/model/model/layers/15/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03b55e79a8265f1f9574674aa4e034a28c98aefbb3318ea7ad38d3b20443aa99 +size 1639193 diff --git 
a/model/model/layers/15/self_attn/o_proj/kernel/0.1 b/model/model/layers/15/self_attn/o_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..7d173edef1a7e90409c92e8d49fd36cc98ea5d02 --- /dev/null +++ b/model/model/layers/15/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5bad1c2c501700f4cefdefce2d919045f1709550dab9871d9dbc3e5e2586779 +size 1639667 diff --git a/model/model/layers/15/self_attn/o_proj/kernel/0.2 b/model/model/layers/15/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..faf7d4dfc215f9f26f78df770c70995af1291742 --- /dev/null +++ b/model/model/layers/15/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02699579f9870d2f5a5b1bca576eaac3f217c5cf59d81631d7b27961018e67fc +size 1639528 diff --git a/model/model/layers/15/self_attn/o_proj/kernel/0.3 b/model/model/layers/15/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..f3b2864e00dce3bbbe6a16171cd211a0c7315c5c --- /dev/null +++ b/model/model/layers/15/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:499eb436e585570c36d8c17b5213657a9711431f026974f8870cbd81ea0be7b6 +size 1638961 diff --git a/model/model/layers/15/self_attn/q_proj/kernel/.zarray b/model/model/layers/15/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..059f1aabbdc9e18d982e2db50174668264fc96e4 --- /dev/null +++ b/model/model/layers/15/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/15/self_attn/q_proj/kernel/0.0 b/model/model/layers/15/self_attn/q_proj/kernel/0.0 new file mode 100644 
index 0000000000000000000000000000000000000000..88146734516d453e31768979b2c65d63587dee7c --- /dev/null +++ b/model/model/layers/15/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f69d70d364dfe2c4eae23c22965f025e1240f1ed0cf7d5f9a390e4d31ee1066 +size 1657164 diff --git a/model/model/layers/15/self_attn/q_proj/kernel/1.0 b/model/model/layers/15/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..29e865d978cf3b35de8cb33abfa0e303b6ca4033 --- /dev/null +++ b/model/model/layers/15/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97b4b320b936dd75dc761516669a37add0c7e34d16f056961b2342e2e213b393 +size 1657479 diff --git a/model/model/layers/15/self_attn/q_proj/kernel/2.0 b/model/model/layers/15/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..311cf3a56802da2c612627152d00432115e6bb93 --- /dev/null +++ b/model/model/layers/15/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fd54babfbfe3560c9a7396a330ff964cefe3878973102f566b404a9a87ba5a8 +size 1657400 diff --git a/model/model/layers/15/self_attn/q_proj/kernel/3.0 b/model/model/layers/15/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..8f8361931af7db1e544c7c5c17d359bde85331d5 --- /dev/null +++ b/model/model/layers/15/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2fd389d818d01ccb04aceccf08e78888b2fb476faf0dde0cccf54c368900d55 +size 1657269 diff --git a/model/model/layers/15/self_attn/v_proj/kernel/.zarray b/model/model/layers/15/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/15/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/15/self_attn/v_proj/kernel/0.0 b/model/model/layers/15/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a64f190ea2d0975f1d210b308ac3a89f3920a6b1 --- /dev/null +++ b/model/model/layers/15/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:136a4018d3f214153c08f0e80274d87856bef8125eb46b4f6bac1aac7e610d72 +size 411015 diff --git a/model/model/layers/15/self_attn/v_proj/kernel/1.0 b/model/model/layers/15/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..945e96729eef77ab9a5e2fa2dbb4c695ee626c5c --- /dev/null +++ b/model/model/layers/15/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2afd660eb6be6d9b5367debbf98c0d46f8fa4d04110d2216752abd2f1509d7a7 +size 410969 diff --git a/model/model/layers/15/self_attn/v_proj/kernel/2.0 b/model/model/layers/15/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..7dd5e2ffa2c236c12edacfe4204094e653f256ac --- /dev/null +++ b/model/model/layers/15/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a91fc2d665375edbc5a113b68a8450e7302ed1b5c5d653a11a501ee48a67f242 +size 410515 diff --git a/model/model/layers/15/self_attn/v_proj/kernel/3.0 b/model/model/layers/15/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..745bfc97d69b3e58fcb7ec77a43c4356052342c8 --- /dev/null +++ b/model/model/layers/15/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a510fcbce2a88db17c4dc7b790ce0b1f05faec3d689ab52a2dd14011a5be68f1 +size 410896 diff 
--git a/model/model/layers/2/input_layernorm/kernel/.zarray b/model/model/layers/2/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/2/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/input_layernorm/kernel/0 b/model/model/layers/2/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..7e04aa72422f0c70f6fdc2db6af0c661fc225124 Binary files /dev/null and b/model/model/layers/2/input_layernorm/kernel/0 differ diff --git a/model/model/layers/2/mlp/down_proj/kernel/.zarray b/model/model/layers/2/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..b57b49d09e50779e6e0a2e2d784feed4998dadab --- /dev/null +++ b/model/model/layers/2/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/mlp/down_proj/kernel/0.0 b/model/model/layers/2/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..d64aa7ff6938a242603b9253004fb880d155e551 --- /dev/null +++ b/model/model/layers/2/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab1cc559a1664b91f8261fbd15698cdcfc77c5afeed2d20aecf797eba26f45d2 +size 6527396 diff --git a/model/model/layers/2/mlp/down_proj/kernel/0.1 b/model/model/layers/2/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..7e583ad04dcd9b31bebbec93240c711db129f105 --- 
/dev/null +++ b/model/model/layers/2/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f69aaf60aead1d6eae7fcd9c57da4cfd7cdd9268ead1f6107ba1bff5cf1b72f +size 6527544 diff --git a/model/model/layers/2/mlp/down_proj/kernel/0.2 b/model/model/layers/2/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..845328c0f3103c1698258ef6ae4c96da359b7cb1 --- /dev/null +++ b/model/model/layers/2/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfcd7227cf71d1a91ebac2bfe1fcc055df06fabc93a4e366fca3e676c7d75551 +size 6525539 diff --git a/model/model/layers/2/mlp/down_proj/kernel/0.3 b/model/model/layers/2/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..6a055de447bafbc24e5b18881107071655e864a2 --- /dev/null +++ b/model/model/layers/2/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44190275012bc4f79f243b410a793129ddb5b362b2cb8f74d4337e693ff5f76e +size 6528449 diff --git a/model/model/layers/2/mlp/gate_proj/kernel/.zarray b/model/model/layers/2/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/2/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/mlp/gate_proj/kernel/0.0 b/model/model/layers/2/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..df41db43959c5095970f333963dd7c0558e09af4 --- /dev/null +++ b/model/model/layers/2/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:05c53a62b6294422c3610798199ae49dc22a930c3a8945787421d752f0ad9c91 +size 6551366 diff --git a/model/model/layers/2/mlp/gate_proj/kernel/1.0 b/model/model/layers/2/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..3fc004ecc6adaedac07f8e5e94b4160510f1119a --- /dev/null +++ b/model/model/layers/2/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3f647676595f527d938bdcc6afefb305b4d95dd4e0242d33785025e82cce08d +size 6549718 diff --git a/model/model/layers/2/mlp/gate_proj/kernel/2.0 b/model/model/layers/2/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..bb0518fc01cf6eec649dec58d8529a1f21aadf29 --- /dev/null +++ b/model/model/layers/2/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a9c3cff9d6b201645a00c356193a2580dc08d81252e0749edeee391a5429081 +size 6551235 diff --git a/model/model/layers/2/mlp/gate_proj/kernel/3.0 b/model/model/layers/2/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..343a8649d2ba0e6e135b19dc1981bd79e2dc18f4 --- /dev/null +++ b/model/model/layers/2/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:492b312caedc7fc859ec2c515ec011572b1afb66a6977e7711b23e061217b530 +size 6551089 diff --git a/model/model/layers/2/mlp/up_proj/kernel/.zarray b/model/model/layers/2/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/2/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/mlp/up_proj/kernel/0.0 
b/model/model/layers/2/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..16538a896e7de6489548953ed824cb83ee447e9b --- /dev/null +++ b/model/model/layers/2/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87429c51b429bc34bff7efeac6d92d3e8b3b896fd48694e6f52509ccda56a814 +size 6525011 diff --git a/model/model/layers/2/mlp/up_proj/kernel/1.0 b/model/model/layers/2/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..cf5c58791cb71ed678deaaaa89597046fecafd94 --- /dev/null +++ b/model/model/layers/2/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c0466a4029a09f9696b206465ed864625da3218553337c1bb9e0c916f55c164 +size 6525117 diff --git a/model/model/layers/2/mlp/up_proj/kernel/2.0 b/model/model/layers/2/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..eb5124fd9dc47617f737a6d38b551cfc0214b84c --- /dev/null +++ b/model/model/layers/2/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55ab20934423e2aa5265bc79a2107cfbb02f3644d50e26985076079659a5ff76 +size 6525046 diff --git a/model/model/layers/2/mlp/up_proj/kernel/3.0 b/model/model/layers/2/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..ca6aa369c10d83c3c30178b888363519c331e936 --- /dev/null +++ b/model/model/layers/2/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:046e2361a4a893b0560d4ece7ff2bb421c993f79d6748a95d6be0466f7487179 +size 6524765 diff --git a/model/model/layers/2/post_attention_layernorm/kernel/.zarray b/model/model/layers/2/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/2/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/post_attention_layernorm/kernel/0 b/model/model/layers/2/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..964a575090576f6ff2910b24fc19a969bf324e2f Binary files /dev/null and b/model/model/layers/2/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/2/self_attn/k_proj/kernel/.zarray b/model/model/layers/2/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/2/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/self_attn/k_proj/kernel/0.0 b/model/model/layers/2/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f9d59480873d78948d8f4d00e077822056fe8ba3 --- /dev/null +++ b/model/model/layers/2/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aebd48f613fadafc45de638e0929e375078fe5dca1ddc815bd2a20cb1f116c89 +size 411556 diff --git a/model/model/layers/2/self_attn/k_proj/kernel/1.0 b/model/model/layers/2/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..17e28e6d4c5b5abe7615f0bede6190d86f9c0b69 --- /dev/null +++ b/model/model/layers/2/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a0df517f0c72d01fc7a80fc5e7ca2e17f77efa395da5155d4315dd292613550 +size 411540 diff --git 
a/model/model/layers/2/self_attn/k_proj/kernel/2.0 b/model/model/layers/2/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..c98320362299a5617ac0db8e41c7a29ab7bcabd0 --- /dev/null +++ b/model/model/layers/2/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:424ff7116677a1746e8a3bafb43f4b7b88ad20edcc09e0977e50c794aadf8c7c +size 412063 diff --git a/model/model/layers/2/self_attn/k_proj/kernel/3.0 b/model/model/layers/2/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..1ed5e52246b3bcd669961f6eedff0b1e0f4ab075 --- /dev/null +++ b/model/model/layers/2/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82616e147cb6fd952ef2e79aba94bb0a6ebf43c1c7756c93ef3f1f6845e53fb0 +size 411644 diff --git a/model/model/layers/2/self_attn/o_proj/kernel/.zarray b/model/model/layers/2/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..1f43215c04ea8738b5721bed11256b14599d4e36 --- /dev/null +++ b/model/model/layers/2/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/self_attn/o_proj/kernel/0.0 b/model/model/layers/2/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..d62dc39cf928f8b7b9878fd4818dd4788b1c3f63 --- /dev/null +++ b/model/model/layers/2/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4fa7edd8b3fa4fe5fea6dea069966bc10faa37c3738c30e704262159edb8ad5 +size 1635566 diff --git a/model/model/layers/2/self_attn/o_proj/kernel/0.1 b/model/model/layers/2/self_attn/o_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..c9bccb76be7f394c75faf3eb235646121d68277c --- /dev/null +++ b/model/model/layers/2/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9188684b93ac8f0a17ee5141379322a3c6e48a884e8937eb036c85643478bad +size 1635910 diff --git a/model/model/layers/2/self_attn/o_proj/kernel/0.2 b/model/model/layers/2/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..281a55b72034756dc1313607a64883093bdbe42d --- /dev/null +++ b/model/model/layers/2/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1c25a2a4520db33fa359a04b03951b45599389c5045a41ba15583f86079dac9 +size 1634962 diff --git a/model/model/layers/2/self_attn/o_proj/kernel/0.3 b/model/model/layers/2/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..52d6fb22248515410c3cb3c2f588cb34980bc660 --- /dev/null +++ b/model/model/layers/2/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8664e83af6d509e256d8f1d1d46399f9da92809a4c5f934c0575b11d3d21aa16 +size 1635996 diff --git a/model/model/layers/2/self_attn/q_proj/kernel/.zarray b/model/model/layers/2/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..059f1aabbdc9e18d982e2db50174668264fc96e4 --- /dev/null +++ b/model/model/layers/2/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/self_attn/q_proj/kernel/0.0 b/model/model/layers/2/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..5df2176080f6597f811ebd00c8d2e44f883a196e --- /dev/null +++ 
b/model/model/layers/2/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeab3cc56fb06736eb1e1c7a1a0a11f3619476db9bddb214a4c770ca9bf78e47 +size 1652432 diff --git a/model/model/layers/2/self_attn/q_proj/kernel/1.0 b/model/model/layers/2/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..9c996b2785ed8636b7fb85ffbaef25264197d59d --- /dev/null +++ b/model/model/layers/2/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b9de6057fb2337552f1d538cec3b69465b50aa0ec5bf59f460ba2997d6d11d0 +size 1652550 diff --git a/model/model/layers/2/self_attn/q_proj/kernel/2.0 b/model/model/layers/2/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..244693eaaec238ff673d87818b90322ff3b2b4f3 --- /dev/null +++ b/model/model/layers/2/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d238a89ddff3353c430ad9431445d147f97485d4c89583b49a366e42262b85cc +size 1653603 diff --git a/model/model/layers/2/self_attn/q_proj/kernel/3.0 b/model/model/layers/2/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..9d0d656068eed1beb0adce9a4bf7df381c05d0eb --- /dev/null +++ b/model/model/layers/2/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0481db451cb1da78989ba5838303efd53e0a2db5511d4d1535e25e0f800e0819 +size 1653091 diff --git a/model/model/layers/2/self_attn/v_proj/kernel/.zarray b/model/model/layers/2/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/2/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/2/self_attn/v_proj/kernel/0.0 b/model/model/layers/2/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..5812bdde92062210eb68ef1069d620037555816a --- /dev/null +++ b/model/model/layers/2/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1b287f5c018f4325ddf503095e19e2ee000b2c8f4c746f47ebc0069d033fc8b +size 409535 diff --git a/model/model/layers/2/self_attn/v_proj/kernel/1.0 b/model/model/layers/2/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..c5fbbdb94f17d69e13d4351556790201b86bd758 --- /dev/null +++ b/model/model/layers/2/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5190caecada72e260c72274ce622dc93a939c2ef3aa645b9af5db84342d55eef +size 409509 diff --git a/model/model/layers/2/self_attn/v_proj/kernel/2.0 b/model/model/layers/2/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..1be8513272b2fa1643a985889ed44075ba32672f --- /dev/null +++ b/model/model/layers/2/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:304a1f762db8be0923fd28387dc500c1f3ee1d89245e724b31ad05d6264c9f89 +size 409814 diff --git a/model/model/layers/2/self_attn/v_proj/kernel/3.0 b/model/model/layers/2/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..b2548319053e9cad61087f7db39835180d6ba3fb --- /dev/null +++ b/model/model/layers/2/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b73aff74f5da89a262ffa83325d8910bcf51aac46e8b06ab23d4eb0f09ba716d +size 409783 diff --git 
a/model/model/layers/3/input_layernorm/kernel/.zarray b/model/model/layers/3/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/3/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/input_layernorm/kernel/0 b/model/model/layers/3/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..152510f8c0b6a14f35917c0e6185b06046288679 Binary files /dev/null and b/model/model/layers/3/input_layernorm/kernel/0 differ diff --git a/model/model/layers/3/mlp/down_proj/kernel/.zarray b/model/model/layers/3/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..b57b49d09e50779e6e0a2e2d784feed4998dadab --- /dev/null +++ b/model/model/layers/3/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/mlp/down_proj/kernel/0.0 b/model/model/layers/3/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..5b4bbc757b2c4125d2a2f96c334fc727ee4d60eb --- /dev/null +++ b/model/model/layers/3/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fccceb9764f5b7eec93713c4729cfffd912e21eb90f54b43e781f78a5ef16f22 +size 6529201 diff --git a/model/model/layers/3/mlp/down_proj/kernel/0.1 b/model/model/layers/3/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..e0cc9e7ed0359f7528c4f139cbb6d71ee12f2843 --- /dev/null +++ 
b/model/model/layers/3/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:352343aef5da3fdd21e003f8a63d1c65784f7d439701d134b025bbe93bafaa9f +size 6530725 diff --git a/model/model/layers/3/mlp/down_proj/kernel/0.2 b/model/model/layers/3/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..30fa8ffc1878e55d8af6d23dc58a47a2c09f2387 --- /dev/null +++ b/model/model/layers/3/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0faa7a4d2f9a7195d3461862198f3274fef7aba46ccc8e64fe75a35e7e129d7 +size 6526444 diff --git a/model/model/layers/3/mlp/down_proj/kernel/0.3 b/model/model/layers/3/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..911d68e672b657fddd617ccbaf10afc238e24a0c --- /dev/null +++ b/model/model/layers/3/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09f0bc04eed9044e27b588a492abc96a8edbc4326f4a8436fad14ac23e4bd933 +size 6530687 diff --git a/model/model/layers/3/mlp/gate_proj/kernel/.zarray b/model/model/layers/3/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/3/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/mlp/gate_proj/kernel/0.0 b/model/model/layers/3/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..08b0ff0377ff3e2eab639665961c2da6d1d7485b --- /dev/null +++ b/model/model/layers/3/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:4b1647640f2f1993a711e56c0135d96a97412459f1adf55a1100bbfba734a704 +size 6567909 diff --git a/model/model/layers/3/mlp/gate_proj/kernel/1.0 b/model/model/layers/3/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..d65a597fc4585a8677fd7c9b621177eb88d37cd3 --- /dev/null +++ b/model/model/layers/3/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73680442f54cdb855c4bcf4b47b9e7a02b744a1606af2e06938822220e114392 +size 6567992 diff --git a/model/model/layers/3/mlp/gate_proj/kernel/2.0 b/model/model/layers/3/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..b18474c9dc66bb1bbf1fba223fe067dc6519d5b0 --- /dev/null +++ b/model/model/layers/3/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86933aef6e675c3c9debc6ee30a9bb826349f5c5da030ed1f45ef9ebb6c63e5a +size 6568130 diff --git a/model/model/layers/3/mlp/gate_proj/kernel/3.0 b/model/model/layers/3/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..877c24f47cd9bb3083fa3b2615991a6d6ce79fdb --- /dev/null +++ b/model/model/layers/3/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca403224dd16de3464f885dafe02ec6e802abdc9f93f164f7a6e7410347509a8 +size 6568366 diff --git a/model/model/layers/3/mlp/up_proj/kernel/.zarray b/model/model/layers/3/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/3/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/mlp/up_proj/kernel/0.0 
b/model/model/layers/3/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..edb4f25f2b266e18b5c27587aea23adaec06a72f --- /dev/null +++ b/model/model/layers/3/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c0f7d92ec3057bcebab243a1ed64d776399f3d92ff964201c5e4e4e19936311 +size 6525616 diff --git a/model/model/layers/3/mlp/up_proj/kernel/1.0 b/model/model/layers/3/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..738a7d5e9c45c7151c481dec7cc2060a08857406 --- /dev/null +++ b/model/model/layers/3/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80f9c9e58b05fabe9c8354704552e98513c544835315d20f7f290ba9ba5340bf +size 6524678 diff --git a/model/model/layers/3/mlp/up_proj/kernel/2.0 b/model/model/layers/3/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..b771fb13e135d3452ea382079cfde18fa5765932 --- /dev/null +++ b/model/model/layers/3/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:920947d8c6760f38632952cd82753a8fa7fb1633b76058bfc671f2be6645874b +size 6524538 diff --git a/model/model/layers/3/mlp/up_proj/kernel/3.0 b/model/model/layers/3/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..ac9f0df996d424d46df054f99f1be13d3de9bf73 --- /dev/null +++ b/model/model/layers/3/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dc385d3633ab09fcc86923f4677ff639a9ce2df886c2ba50f515bd8b8927b68 +size 6524780 diff --git a/model/model/layers/3/post_attention_layernorm/kernel/.zarray b/model/model/layers/3/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/3/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/post_attention_layernorm/kernel/0 b/model/model/layers/3/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..3b080efa145a00863540f7a471fc2ed5dac2e715 Binary files /dev/null and b/model/model/layers/3/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/3/self_attn/k_proj/kernel/.zarray b/model/model/layers/3/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/3/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/self_attn/k_proj/kernel/0.0 b/model/model/layers/3/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..797efdcb977f2f5d085f8983e5233b4bf215b240 --- /dev/null +++ b/model/model/layers/3/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8de3c18c5ba83ec4d10619dc3996545fe9c40ce533b21449e90f742dccc58f13 +size 411500 diff --git a/model/model/layers/3/self_attn/k_proj/kernel/1.0 b/model/model/layers/3/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..0f0b63c1be28108f2ad0de1079dfea04023c8cb2 --- /dev/null +++ b/model/model/layers/3/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64c2feefe81dd5d6f7042900249f24559da672588bd696ffefaa150efafb9c4c +size 411424 diff --git 
a/model/model/layers/3/self_attn/k_proj/kernel/2.0 b/model/model/layers/3/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..cfde7f224dc9304b1132a511e4d95f5256ab3d26 --- /dev/null +++ b/model/model/layers/3/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff7697998c8f91606ff0f634ace896a6a9a69b4d7596e3a424048c808995d801 +size 411226 diff --git a/model/model/layers/3/self_attn/k_proj/kernel/3.0 b/model/model/layers/3/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..5b87272ed8369ceca1b2dea6c634605e7014788b --- /dev/null +++ b/model/model/layers/3/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:112b775161b379d3e53fa5b25b68ab0bbdcacfe2d8155cff3b9d7d91be1225a2 +size 411375 diff --git a/model/model/layers/3/self_attn/o_proj/kernel/.zarray b/model/model/layers/3/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..1f43215c04ea8738b5721bed11256b14599d4e36 --- /dev/null +++ b/model/model/layers/3/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/self_attn/o_proj/kernel/0.0 b/model/model/layers/3/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..751cda0cacb751f56572bdeab740a9ef80c75b88 --- /dev/null +++ b/model/model/layers/3/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3fb064d9d1b8d89ead06e80be674308ca4b433d3a40f7847f04e0b8d7aef9a0 +size 1634232 diff --git a/model/model/layers/3/self_attn/o_proj/kernel/0.1 b/model/model/layers/3/self_attn/o_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..2f698962a91059fb76dd9c6c75f98196c0afaf02 --- /dev/null +++ b/model/model/layers/3/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:209209e1822b79618ce756f17c1e3cee3f996bedc04242d8063e31bb85a6445b +size 1634335 diff --git a/model/model/layers/3/self_attn/o_proj/kernel/0.2 b/model/model/layers/3/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..b19a866050aca190f13a4124775deaa5c24d9d3d --- /dev/null +++ b/model/model/layers/3/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d8a16dfaee2b27af9d072f4bbb2ce777f150224a0f14b27c9ef937f666aee64 +size 1633931 diff --git a/model/model/layers/3/self_attn/o_proj/kernel/0.3 b/model/model/layers/3/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..f5a77ef60dba6782d75d550a69cd5d779f62cc2f --- /dev/null +++ b/model/model/layers/3/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d63f64d789462bc28a8bd2008346c5d4b9040f38a328cfeb3ce2ab918e23ecb +size 1634222 diff --git a/model/model/layers/3/self_attn/q_proj/kernel/.zarray b/model/model/layers/3/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..059f1aabbdc9e18d982e2db50174668264fc96e4 --- /dev/null +++ b/model/model/layers/3/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/self_attn/q_proj/kernel/0.0 b/model/model/layers/3/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..b06488d1dbc0b2384419e2c449a14f01692e8ddc --- /dev/null +++ 
b/model/model/layers/3/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1d29a131b34ad0c1faab791b39198546ce5ba7fb4a308c42b1c28a19255ee5e +size 1647355 diff --git a/model/model/layers/3/self_attn/q_proj/kernel/1.0 b/model/model/layers/3/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..e67f7448fad9844bb92349a52f045b26d52072d7 --- /dev/null +++ b/model/model/layers/3/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab478fbe1fb0c09c0b0cb09853a38fef1643488185e80749de7fdb0feaab5524 +size 1646720 diff --git a/model/model/layers/3/self_attn/q_proj/kernel/2.0 b/model/model/layers/3/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..49944a96b5195457074bad77bc72cbebf1461acf --- /dev/null +++ b/model/model/layers/3/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebbbb40b7ddbae5d46e7dff2d83c6e0e6116ccd5a0fcd2b76b723ee198ce8394 +size 1646956 diff --git a/model/model/layers/3/self_attn/q_proj/kernel/3.0 b/model/model/layers/3/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..c115d0bc2c47893f516a991f384d5ed353106047 --- /dev/null +++ b/model/model/layers/3/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:306a7ce8d50b409d92949334c1cd272a6238a8ea99b73d79277066712dea35cd +size 1647398 diff --git a/model/model/layers/3/self_attn/v_proj/kernel/.zarray b/model/model/layers/3/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/3/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/3/self_attn/v_proj/kernel/0.0 b/model/model/layers/3/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..56d3e394b7e803a29326b4eb9c4a85f1ec2c59fa --- /dev/null +++ b/model/model/layers/3/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf89b07dc1906d113751960ae5a6e44a119a2e1ecae8ebdc769ac46131399fd7 +size 409604 diff --git a/model/model/layers/3/self_attn/v_proj/kernel/1.0 b/model/model/layers/3/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..637baaec4dce8e854feb9fa5865884fce42bcf55 --- /dev/null +++ b/model/model/layers/3/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d78e60a9a68080756ad5bb21171c26fc0d77e0b1914293b2490cb0bc50bf2f90 +size 409524 diff --git a/model/model/layers/3/self_attn/v_proj/kernel/2.0 b/model/model/layers/3/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..3d6cac59aff23e26fb6e17918b08648bb93b5fa4 --- /dev/null +++ b/model/model/layers/3/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9072a19de9b9be9e59f54b21c202a772b64d89c63046825bdb9d914fe5ecad5f +size 409655 diff --git a/model/model/layers/3/self_attn/v_proj/kernel/3.0 b/model/model/layers/3/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..a9603fc2c8f08092373f6e9b03cf270464b12946 --- /dev/null +++ b/model/model/layers/3/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:497a4483666ae647573876954942d32487b246ddc1cc8efbbce6a3ee95333b4e +size 409669 diff --git 
a/model/model/layers/4/input_layernorm/kernel/.zarray b/model/model/layers/4/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/4/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/input_layernorm/kernel/0 b/model/model/layers/4/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..fa4716acbe083f8979452f6d296b20d806eed326 Binary files /dev/null and b/model/model/layers/4/input_layernorm/kernel/0 differ diff --git a/model/model/layers/4/mlp/down_proj/kernel/.zarray b/model/model/layers/4/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..b57b49d09e50779e6e0a2e2d784feed4998dadab --- /dev/null +++ b/model/model/layers/4/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/mlp/down_proj/kernel/0.0 b/model/model/layers/4/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..569722de97dbc72ea75993c32524aadba280d428 --- /dev/null +++ b/model/model/layers/4/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35f49ce8a65a6876dda314c75a0d13c279f1561513e5bb5e12564f1a86557548 +size 6531675 diff --git a/model/model/layers/4/mlp/down_proj/kernel/0.1 b/model/model/layers/4/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..aeb77e15dd3bbf9997cbfa8868e1f087efb490d8 --- /dev/null +++ 
b/model/model/layers/4/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e00e6e381eb92369bfc23ee9bd86a94a8715a56d352aa35634e07ea1a38be2c0 +size 6533436 diff --git a/model/model/layers/4/mlp/down_proj/kernel/0.2 b/model/model/layers/4/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..78fb5a7283bae0fb8843550250aae2f28877815d --- /dev/null +++ b/model/model/layers/4/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c62e913cb22389d34aacfac513ff59eeaee0964eaea861213144e2334173ee3 +size 6529576 diff --git a/model/model/layers/4/mlp/down_proj/kernel/0.3 b/model/model/layers/4/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..f05d41382ec61651fcea46a5f181028351b5297b --- /dev/null +++ b/model/model/layers/4/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7b097a46a0d175a8204b621879c3914c07641186fce1f8bc94aedfd90e310ad +size 6532710 diff --git a/model/model/layers/4/mlp/gate_proj/kernel/.zarray b/model/model/layers/4/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/4/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/mlp/gate_proj/kernel/0.0 b/model/model/layers/4/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..426f1e7bedf4eb69e79ef07a2a763be5275329f3 --- /dev/null +++ b/model/model/layers/4/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:7abebe1335521d2ba419d20e5d4d8f21e5554e99a2a6b4c7314cd05ca6e5746b +size 6576287 diff --git a/model/model/layers/4/mlp/gate_proj/kernel/1.0 b/model/model/layers/4/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..6f94e20b93a73023119220ed34c5f9bedba7f451 --- /dev/null +++ b/model/model/layers/4/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b20264b9900b1e24ef630d5038662e03047a61746e6328a65e6032abc064e6ce +size 6575744 diff --git a/model/model/layers/4/mlp/gate_proj/kernel/2.0 b/model/model/layers/4/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..9f43ee6fd912b9dcac148c5f55b91b1f7bbb165a --- /dev/null +++ b/model/model/layers/4/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23088481fb077c95fae39fae565db0ee8ba2f554f642c2ed89843138eed7a8fe +size 6575839 diff --git a/model/model/layers/4/mlp/gate_proj/kernel/3.0 b/model/model/layers/4/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..b72292d27a7526edd6e9ffec8793ec09a0731418 --- /dev/null +++ b/model/model/layers/4/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:435158793e832066a1f3eb2df2ad6ded1398af37cb4584a8ea058cd4fbeabfac +size 6576550 diff --git a/model/model/layers/4/mlp/up_proj/kernel/.zarray b/model/model/layers/4/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/4/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/mlp/up_proj/kernel/0.0 
b/model/model/layers/4/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..049e456f0d933fbfbe631ce77cc3fbe02b1edfcc --- /dev/null +++ b/model/model/layers/4/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f038d5042d0bdc8e36682de1d30cef0b261fbe827e769ca5ee61a9fdcb2bda8 +size 6529759 diff --git a/model/model/layers/4/mlp/up_proj/kernel/1.0 b/model/model/layers/4/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..b2f65e7500989a9dd9769c19575d4169709cc7e6 --- /dev/null +++ b/model/model/layers/4/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cdc18486bfdaeb396f0d3a56fd63f39b602f473300949ecc8bbe9dac6a7c220 +size 6529494 diff --git a/model/model/layers/4/mlp/up_proj/kernel/2.0 b/model/model/layers/4/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..b2fd32afff116ef8c06ae9f90cdae3befcf2e200 --- /dev/null +++ b/model/model/layers/4/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7432bcccb51b4dffe370ae9d9262ce121b20ac8ef0e8b2c2d8ecf242cb6a408f +size 6528077 diff --git a/model/model/layers/4/mlp/up_proj/kernel/3.0 b/model/model/layers/4/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..2f37684a812393b2c3da9c4c4821ebd76b7b0a09 --- /dev/null +++ b/model/model/layers/4/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ace11043465e36bef10b38cff7e04b7cb1d4832546732ec6c85d3cee42e256e2 +size 6527221 diff --git a/model/model/layers/4/post_attention_layernorm/kernel/.zarray b/model/model/layers/4/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/4/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/post_attention_layernorm/kernel/0 b/model/model/layers/4/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..f877191a1ff0f0e72147cfe085059fb10dbe75ce Binary files /dev/null and b/model/model/layers/4/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/4/self_attn/k_proj/kernel/.zarray b/model/model/layers/4/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/4/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/self_attn/k_proj/kernel/0.0 b/model/model/layers/4/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..4aa7f1c390668cff82a44a293338ae123511603b --- /dev/null +++ b/model/model/layers/4/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:799c52c6f1449aa227f57f2222cc59df0a07662baa5853f18e150166a0c8415a +size 411085 diff --git a/model/model/layers/4/self_attn/k_proj/kernel/1.0 b/model/model/layers/4/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..a5a9c8ddd7338ed4af626e3ea39e182fd05b47c4 --- /dev/null +++ b/model/model/layers/4/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74610034fd4c705a44ece555b1de0a4cb07d09d3ff775654d2a84a6ed5bedd9d +size 411105 diff --git 
a/model/model/layers/4/self_attn/k_proj/kernel/2.0 b/model/model/layers/4/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..19b4eff638466c5b39ceb60a451ec708ae055343 --- /dev/null +++ b/model/model/layers/4/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61cb8fcb531ed8ef3c228b1baa64a8ca45921033db69099822e72b0e1053a938 +size 411203 diff --git a/model/model/layers/4/self_attn/k_proj/kernel/3.0 b/model/model/layers/4/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..def7268c2f3f0e2d09e5911a0b14960293e43900 --- /dev/null +++ b/model/model/layers/4/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8bd0af5f3f8c583e1dcc67031b46045607307a58dd59ce15876ea856a938616 +size 411101 diff --git a/model/model/layers/4/self_attn/o_proj/kernel/.zarray b/model/model/layers/4/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..1f43215c04ea8738b5721bed11256b14599d4e36 --- /dev/null +++ b/model/model/layers/4/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/self_attn/o_proj/kernel/0.0 b/model/model/layers/4/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ab28e41dc621fcaae31df9878806fc8cf0f85bfb --- /dev/null +++ b/model/model/layers/4/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:735333303e05ca6cfd82d9728083a2e3a35170b92c84d8e88bcf5cbe2f00781c +size 1636736 diff --git a/model/model/layers/4/self_attn/o_proj/kernel/0.1 b/model/model/layers/4/self_attn/o_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..e8781ed94edc8efd8baa6971b85ecc4506b1c10a --- /dev/null +++ b/model/model/layers/4/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:305582b53be61e39f877ec504dc6125ffbee9d364f09b34017219cc84ba3c49a +size 1637190 diff --git a/model/model/layers/4/self_attn/o_proj/kernel/0.2 b/model/model/layers/4/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..28ddfc71c738db795cadcaead23d51bafa6265be --- /dev/null +++ b/model/model/layers/4/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e0c5be1da08162291e76eab9443c1f6474fa9c070770692dc89cde5940235fd +size 1635588 diff --git a/model/model/layers/4/self_attn/o_proj/kernel/0.3 b/model/model/layers/4/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..22ab0b9946cab7f7b8b9a0be4cbd30ed431614b9 --- /dev/null +++ b/model/model/layers/4/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e4abef40bed1440cf68fc4498c10959fb83420079057027af214fcf71fe7d47 +size 1636925 diff --git a/model/model/layers/4/self_attn/q_proj/kernel/.zarray b/model/model/layers/4/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..059f1aabbdc9e18d982e2db50174668264fc96e4 --- /dev/null +++ b/model/model/layers/4/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/self_attn/q_proj/kernel/0.0 b/model/model/layers/4/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ea026dfe66cd73d74f0d8683c90eca94471084a9 --- /dev/null +++ 
b/model/model/layers/4/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cec3aaef51721a0a7cac56c020d54091f44a475386e225b8335ba90031b497ac +size 1649224 diff --git a/model/model/layers/4/self_attn/q_proj/kernel/1.0 b/model/model/layers/4/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..91108891edfece3de0272153ebd07124a159c8a7 --- /dev/null +++ b/model/model/layers/4/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f9c668e860b69578abe0fae58056ee8dfa4e252120fc0a9c1b114e55fd02a9b +size 1649253 diff --git a/model/model/layers/4/self_attn/q_proj/kernel/2.0 b/model/model/layers/4/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..02aecd87f22a89c5a35cdcd7b0b6921203828e58 --- /dev/null +++ b/model/model/layers/4/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eca35f86af12c8ab45b9f4f432f4bbf5fc96d0b482bcfbc87158a18fca39cdf7 +size 1649012 diff --git a/model/model/layers/4/self_attn/q_proj/kernel/3.0 b/model/model/layers/4/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..5e5a9f56a68b5a715593273b64033ac557d96833 --- /dev/null +++ b/model/model/layers/4/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e213f2be74f94d8d18aa5ee96663e7c2ab28c40066ae7409b2deea4775716e4c +size 1649345 diff --git a/model/model/layers/4/self_attn/v_proj/kernel/.zarray b/model/model/layers/4/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/4/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/4/self_attn/v_proj/kernel/0.0 b/model/model/layers/4/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..25db6ceb375e444754209aeda7105e04eaab0391 --- /dev/null +++ b/model/model/layers/4/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d044daae2e5647ec72890644c33c757e93c3e73fbeb2510207b5a0f34921feb +size 410169 diff --git a/model/model/layers/4/self_attn/v_proj/kernel/1.0 b/model/model/layers/4/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..7f676c25c6836949a84b307918a5501742de2e85 --- /dev/null +++ b/model/model/layers/4/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56e0dcc1708a92b69d434147b5fca8794d7723f355446c1e4a7f7ce80ab9fe40 +size 409935 diff --git a/model/model/layers/4/self_attn/v_proj/kernel/2.0 b/model/model/layers/4/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..1ac3548c610117eb7080d222be5639ff6268dcb0 --- /dev/null +++ b/model/model/layers/4/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7dab1403af11e561522aaed231146c32bf2c8562268f3efd2516a6ce659b2e9 +size 409930 diff --git a/model/model/layers/4/self_attn/v_proj/kernel/3.0 b/model/model/layers/4/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..a1ecab4a38feb879b591a85bb5dbf41a3b7711cd --- /dev/null +++ b/model/model/layers/4/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ab40c559418da20019cfa4b5dcc3c3922f020dea3c160e6c681fc46860fdce2 +size 410171 diff --git 
a/model/model/layers/5/input_layernorm/kernel/.zarray b/model/model/layers/5/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/5/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/input_layernorm/kernel/0 b/model/model/layers/5/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..efbb2e9e8eea6bde9bd12fa055a29d6f00f358ed Binary files /dev/null and b/model/model/layers/5/input_layernorm/kernel/0 differ diff --git a/model/model/layers/5/mlp/down_proj/kernel/.zarray b/model/model/layers/5/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..b57b49d09e50779e6e0a2e2d784feed4998dadab --- /dev/null +++ b/model/model/layers/5/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/mlp/down_proj/kernel/0.0 b/model/model/layers/5/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..7d0e103ed3981a4065461830138565d66c7a4e79 --- /dev/null +++ b/model/model/layers/5/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6203225bf14f69e409069fa68bbcccbc0900c8675efd1f8fb84a090a7d3682e +size 6535280 diff --git a/model/model/layers/5/mlp/down_proj/kernel/0.1 b/model/model/layers/5/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..9fc0780982236118702f27326b485e7450883f73 --- /dev/null +++ 
b/model/model/layers/5/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:416438a7dc14c0cfd4513810260e766a48fa2e6c5f9dafcdca1316defda4bb61 +size 6536516 diff --git a/model/model/layers/5/mlp/down_proj/kernel/0.2 b/model/model/layers/5/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..d025b49249b735e6f6c95d307c5fbc882864b004 --- /dev/null +++ b/model/model/layers/5/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fac8eeee2949e61d732cb27bc9b937272be1b291bc43c9ceb8ed9c9495e0748b +size 6532765 diff --git a/model/model/layers/5/mlp/down_proj/kernel/0.3 b/model/model/layers/5/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..e146b43bd2ab45e11af14a86243e2ab1a0928917 --- /dev/null +++ b/model/model/layers/5/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25f9d0cb2259c460bc1a072b516654baca2d53bd3c0b43b7223c5d6c4a7f58ec +size 6535123 diff --git a/model/model/layers/5/mlp/gate_proj/kernel/.zarray b/model/model/layers/5/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/5/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/mlp/gate_proj/kernel/0.0 b/model/model/layers/5/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8e737b8047b42d44ab585aaaf986d800be365a1b --- /dev/null +++ b/model/model/layers/5/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:f003039efba528d2796333f3e07894e32e88482c7995f0708aef9bc8bf0e43b6 +size 6567375 diff --git a/model/model/layers/5/mlp/gate_proj/kernel/1.0 b/model/model/layers/5/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..1d631650fdc5b1451c5b733b53d9e0763bf653d7 --- /dev/null +++ b/model/model/layers/5/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdebd06e07b5ceba8e3160596e1bcd4af88ecbee260a7d8d57ef6acb2ae43d69 +size 6567047 diff --git a/model/model/layers/5/mlp/gate_proj/kernel/2.0 b/model/model/layers/5/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..f900492542cfd15b89166700bedd0603059542f6 --- /dev/null +++ b/model/model/layers/5/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63a89436bbfcd917b44d9e308c68269d016d5d4438a3a2e17aa251adb4e8191d +size 6567203 diff --git a/model/model/layers/5/mlp/gate_proj/kernel/3.0 b/model/model/layers/5/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..4c091a710a2a8acbfdda41d8cd43d1a5d4291b1b --- /dev/null +++ b/model/model/layers/5/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2b0e5d1a44c066b291276db3751e688e0af9ab6519336e75f45a13bc0d9d203 +size 6566583 diff --git a/model/model/layers/5/mlp/up_proj/kernel/.zarray b/model/model/layers/5/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/5/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/mlp/up_proj/kernel/0.0 
b/model/model/layers/5/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..6dd2c0f828337823ccef6bb151b20f63c558a769 --- /dev/null +++ b/model/model/layers/5/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:188ba93f4194c6c89487e73adcda297d481d6117705fd7602128c7745e18d15f +size 6530287 diff --git a/model/model/layers/5/mlp/up_proj/kernel/1.0 b/model/model/layers/5/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..03400d56efbdd5b6f79c6d2b484191f839b3ce12 --- /dev/null +++ b/model/model/layers/5/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13f507656344f20b9d77e43b93a2d6853bd5224ca34b7f75910ba82021fa5395 +size 6529759 diff --git a/model/model/layers/5/mlp/up_proj/kernel/2.0 b/model/model/layers/5/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..54cc6ec57e0a0ed88060073554d664e7d4c1fb2b --- /dev/null +++ b/model/model/layers/5/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9209cd0854c23ced3c5ad1f999202b1223f229b11719d7da2d8cbc57137c7643 +size 6528855 diff --git a/model/model/layers/5/mlp/up_proj/kernel/3.0 b/model/model/layers/5/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..074d4577fb2f1105a4dae165ac3dba30e2657a53 --- /dev/null +++ b/model/model/layers/5/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdea432bdd769ad872901ffa2c8b398328970c0d8d012671c2686bb841a9a1c4 +size 6527886 diff --git a/model/model/layers/5/post_attention_layernorm/kernel/.zarray b/model/model/layers/5/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/5/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/post_attention_layernorm/kernel/0 b/model/model/layers/5/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..565dd35420d7da7b1b9080c63ff129ff34ef88c7 Binary files /dev/null and b/model/model/layers/5/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/5/self_attn/k_proj/kernel/.zarray b/model/model/layers/5/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/5/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/self_attn/k_proj/kernel/0.0 b/model/model/layers/5/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..5428cbfa3f4974a6d6eafa1fba40c9d655eff8bb --- /dev/null +++ b/model/model/layers/5/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f41ccea8c065db798ff1ffd99c9d3a4f5cf730983df2969894501b9fd838ed0 +size 411856 diff --git a/model/model/layers/5/self_attn/k_proj/kernel/1.0 b/model/model/layers/5/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..fe81c9c4d8fec48a456150591632b0517a8f5050 --- /dev/null +++ b/model/model/layers/5/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c47f30e578e8a997ef6c618e3b30fd5432a027de31b907ad48c3ec215b06be8 +size 411809 diff --git 
a/model/model/layers/5/self_attn/k_proj/kernel/2.0 b/model/model/layers/5/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..20baef849138c18e3c7b01863321d17c4b9faa45 --- /dev/null +++ b/model/model/layers/5/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:448fdbd7f6258b26899eb8852f5751863c32b2f78daad7eb1f206438eb6def92 +size 411553 diff --git a/model/model/layers/5/self_attn/k_proj/kernel/3.0 b/model/model/layers/5/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..16aa5310828d6472c5bbf51ecaf6a1eaa259d846 --- /dev/null +++ b/model/model/layers/5/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6383a5e55edc074a92db4f14f2001d2527f4bfc679c232c9e13463eed6e7d5f4 +size 411608 diff --git a/model/model/layers/5/self_attn/o_proj/kernel/.zarray b/model/model/layers/5/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..1f43215c04ea8738b5721bed11256b14599d4e36 --- /dev/null +++ b/model/model/layers/5/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/self_attn/o_proj/kernel/0.0 b/model/model/layers/5/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c9f0c82a8afed265c2489fd09b46e9a718911d2e --- /dev/null +++ b/model/model/layers/5/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f05d7ae81d7bb554e43352f8961e6bf5cf74cd7aa4fd68e5f273e3b451ce1401 +size 1636900 diff --git a/model/model/layers/5/self_attn/o_proj/kernel/0.1 b/model/model/layers/5/self_attn/o_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..310354d7694bd7919b02e561afd7903e698224d0 --- /dev/null +++ b/model/model/layers/5/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5ae5a6afaad9f9b1ded81c71577c9a08451940da97f00a6383290ad837942f8 +size 1637511 diff --git a/model/model/layers/5/self_attn/o_proj/kernel/0.2 b/model/model/layers/5/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..5f51cacd168971d7235875e7e6e14639906d7978 --- /dev/null +++ b/model/model/layers/5/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31de5886245c5455cf811cb161247a020a3024eee207ff458877040a38136cd3 +size 1636081 diff --git a/model/model/layers/5/self_attn/o_proj/kernel/0.3 b/model/model/layers/5/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..ff7a31f0d9031724356bdedd43ee2147ac8bdd26 --- /dev/null +++ b/model/model/layers/5/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd84f8360473db1f8a9fe24f2e026894722b594370a7b7cc5a314163b6dc238f +size 1636993 diff --git a/model/model/layers/5/self_attn/q_proj/kernel/.zarray b/model/model/layers/5/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..059f1aabbdc9e18d982e2db50174668264fc96e4 --- /dev/null +++ b/model/model/layers/5/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/self_attn/q_proj/kernel/0.0 b/model/model/layers/5/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..d78d67da03b025b35da7cc508b86ae1a65a4b7d0 --- /dev/null +++ 
b/model/model/layers/5/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69de60fefc754f430843a566fa7d900d91ff8d722c96f948d9869a1861448bd4 +size 1652667 diff --git a/model/model/layers/5/self_attn/q_proj/kernel/1.0 b/model/model/layers/5/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..f21eefdfd32a1d1905e133aacb5b5a442525a3ff --- /dev/null +++ b/model/model/layers/5/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c0d2ee0b0a696e479ad54f148840ba3ce7c7152398888e5358b80e9bc0f4d1b +size 1653393 diff --git a/model/model/layers/5/self_attn/q_proj/kernel/2.0 b/model/model/layers/5/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..81db95ef0515bcf3bffe2c85e18405a874d377cc --- /dev/null +++ b/model/model/layers/5/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dc7ae20edce82fa66171711a25be247791ec65426eaa6d8638cad8ca2575324 +size 1652124 diff --git a/model/model/layers/5/self_attn/q_proj/kernel/3.0 b/model/model/layers/5/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..9f13d90e233bfede25fb1fc61e5541c5cc055318 --- /dev/null +++ b/model/model/layers/5/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60454114324a7872e2c79aa230d81f8bbe3d2e2dfba0aac626cfb3262531f878 +size 1652702 diff --git a/model/model/layers/5/self_attn/v_proj/kernel/.zarray b/model/model/layers/5/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/5/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/5/self_attn/v_proj/kernel/0.0 b/model/model/layers/5/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..cdd6042179e5bda6efe787451f529dbfd3391d36 --- /dev/null +++ b/model/model/layers/5/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:852882e1b66aaf9afbecd41d314cb534c6c6ac158b781fdd01c2e8a43c0e2f97 +size 409837 diff --git a/model/model/layers/5/self_attn/v_proj/kernel/1.0 b/model/model/layers/5/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..de6982ccf2cc9f930616d4add843ab958615ce1e --- /dev/null +++ b/model/model/layers/5/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5195fb6fd479976c945223cfb85a4ff21c0d8f92e56c3486353169295a3a7198 +size 409814 diff --git a/model/model/layers/5/self_attn/v_proj/kernel/2.0 b/model/model/layers/5/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..b9b6ebb5756b0cbde89ce36b77b5f8a39057c631 --- /dev/null +++ b/model/model/layers/5/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53fc118006f97fe7b84dcd99bbf1c955ebbb509323f733ad10e5e22700de18c6 +size 409605 diff --git a/model/model/layers/5/self_attn/v_proj/kernel/3.0 b/model/model/layers/5/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..72d82efd4780c186d46e62a191aa2f1c230f43c5 --- /dev/null +++ b/model/model/layers/5/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78200bc57a26812504db7025233f4365018739e515f55f33b31b638321a5b283 +size 409578 diff --git 
a/model/model/layers/6/input_layernorm/kernel/.zarray b/model/model/layers/6/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/6/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/input_layernorm/kernel/0 b/model/model/layers/6/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..f0f836667ed44fcead59b0f5e7d556034debfad7 Binary files /dev/null and b/model/model/layers/6/input_layernorm/kernel/0 differ diff --git a/model/model/layers/6/mlp/down_proj/kernel/.zarray b/model/model/layers/6/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..b57b49d09e50779e6e0a2e2d784feed4998dadab --- /dev/null +++ b/model/model/layers/6/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/mlp/down_proj/kernel/0.0 b/model/model/layers/6/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ab7faf18a4d07e12993fd813c9b82e9666f90e2d --- /dev/null +++ b/model/model/layers/6/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1193093022a1c583acc9fd364484be54cd0c1f56926d99916dea2158750b08f +size 6540028 diff --git a/model/model/layers/6/mlp/down_proj/kernel/0.1 b/model/model/layers/6/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..517f6e13c9b34e17090ca16668fbf1d26a9f60c1 --- /dev/null +++ 
b/model/model/layers/6/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1db4d5bb030b7382a4f5f47a31ac074a5c7c9ec031c411237c9676ea96773488 +size 6540563 diff --git a/model/model/layers/6/mlp/down_proj/kernel/0.2 b/model/model/layers/6/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..49abf160be9d00eccecfb9e09f695e4390541633 --- /dev/null +++ b/model/model/layers/6/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97daad03f5236821686fa0bc34f811dfe1dd3fa20f394d081fdcee40e0209a6f +size 6536506 diff --git a/model/model/layers/6/mlp/down_proj/kernel/0.3 b/model/model/layers/6/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..2f503f90f167e167f0f6614655ca8d6d0f9e90b5 --- /dev/null +++ b/model/model/layers/6/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c059e809136341d3ec59928c43df9dee6211ac6873a010e2d2f3dea9275f33d3 +size 6539396 diff --git a/model/model/layers/6/mlp/gate_proj/kernel/.zarray b/model/model/layers/6/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/6/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/mlp/gate_proj/kernel/0.0 b/model/model/layers/6/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..db79f3e11f9ea7431633b713d409a6df2efc0f29 --- /dev/null +++ b/model/model/layers/6/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:1ee098919e40a9c667d03780801be6fcabe12ba314b684b01545c43c5cb31acb +size 6564378 diff --git a/model/model/layers/6/mlp/gate_proj/kernel/1.0 b/model/model/layers/6/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..77803460a773deb85690449b7c91d223b52d42a8 --- /dev/null +++ b/model/model/layers/6/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1b42cb9ab7c1e1dde0634fa030948b903a6ff0dee52a493c7f1571b5f50097f +size 6565312 diff --git a/model/model/layers/6/mlp/gate_proj/kernel/2.0 b/model/model/layers/6/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..3832070faf91b63a84b5d10faa7706f8389db46c --- /dev/null +++ b/model/model/layers/6/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ec08c572f802c542c0cbad0cbde313cd25118f81e3aa90c8d88ed0ed0243509 +size 6564864 diff --git a/model/model/layers/6/mlp/gate_proj/kernel/3.0 b/model/model/layers/6/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..0a13293f7f4b103c4f55598da1440d0bbaa95590 --- /dev/null +++ b/model/model/layers/6/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:067eacd2f4244a0af9e6aedaa3ecd658c71cb848f9246d786a6ee63dd6d40273 +size 6564525 diff --git a/model/model/layers/6/mlp/up_proj/kernel/.zarray b/model/model/layers/6/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/6/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/mlp/up_proj/kernel/0.0 
b/model/model/layers/6/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..9207d4f94ee43c554a8b41751b005b3c4d90c175 --- /dev/null +++ b/model/model/layers/6/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58e0e5996cbd44b703045929e5af391ae72ad9088016de8a75c74d174a92782b +size 6531328 diff --git a/model/model/layers/6/mlp/up_proj/kernel/1.0 b/model/model/layers/6/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..dbafcf6e5c10a84e124bd2644c0096f4d62423fd --- /dev/null +++ b/model/model/layers/6/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93890102a2b59521f6cdcdf3ccf0f6f360b8d6edc015494ef9c4c28a3c8dabee +size 6531237 diff --git a/model/model/layers/6/mlp/up_proj/kernel/2.0 b/model/model/layers/6/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..14250514af572952bdbe3c5c8a4282bc9de6fdff --- /dev/null +++ b/model/model/layers/6/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3223916e73efa4f0eb825c1069de08f71ea5438c15caca8e4b4807d62cf97596 +size 6530086 diff --git a/model/model/layers/6/mlp/up_proj/kernel/3.0 b/model/model/layers/6/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..ad8273f232abdf1bba96c9adcc114b2cb03e367a --- /dev/null +++ b/model/model/layers/6/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59428a905671a3be35a0c03158341b826dc23b19605e8d3eefe0fe771b418cd7 +size 6528899 diff --git a/model/model/layers/6/post_attention_layernorm/kernel/.zarray b/model/model/layers/6/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/6/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/post_attention_layernorm/kernel/0 b/model/model/layers/6/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..24efc76a5aaf78b9301fc1b536d22c4d375ff1b4 Binary files /dev/null and b/model/model/layers/6/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/6/self_attn/k_proj/kernel/.zarray b/model/model/layers/6/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/6/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/self_attn/k_proj/kernel/0.0 b/model/model/layers/6/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c8878de1526b92c806b5fc19fd1ca82779cc8b76 --- /dev/null +++ b/model/model/layers/6/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30a2a1c891185410fcd04f8b620121b8e9cc3c170280d17a8fd6b9f5e59553fd +size 412229 diff --git a/model/model/layers/6/self_attn/k_proj/kernel/1.0 b/model/model/layers/6/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..0fcfca940f8c2b0937c3215a99c8bfc1be7e4fd0 --- /dev/null +++ b/model/model/layers/6/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a25ac48990477bf590ad726543efd53934678993ee00faf462590ce6c2d6e32 +size 412125 diff --git 
a/model/model/layers/6/self_attn/k_proj/kernel/2.0 b/model/model/layers/6/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..a578172aadc395aa437c091f07aebc75bcca1320 --- /dev/null +++ b/model/model/layers/6/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83f4fff709f06480bee4f988be31c3f156c04e4a9b5cdaa97edba124b24bde90 +size 411987 diff --git a/model/model/layers/6/self_attn/k_proj/kernel/3.0 b/model/model/layers/6/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..51d15a6276c811db97f4b6bf551bb56d2c848bfb --- /dev/null +++ b/model/model/layers/6/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a60d942b0c40fc60c1bfe974c5751122ffe04a7f78358e0d0f79e5428f44c3b +size 412062 diff --git a/model/model/layers/6/self_attn/o_proj/kernel/.zarray b/model/model/layers/6/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..1f43215c04ea8738b5721bed11256b14599d4e36 --- /dev/null +++ b/model/model/layers/6/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/self_attn/o_proj/kernel/0.0 b/model/model/layers/6/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e626a2ac3b01bd6b516d79edf853ce7623426b3a --- /dev/null +++ b/model/model/layers/6/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df5388c5f245e976221d1919dc32dfb55d9992c059a3ea20677bffe9ca15919e +size 1637040 diff --git a/model/model/layers/6/self_attn/o_proj/kernel/0.1 b/model/model/layers/6/self_attn/o_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..c03311cd15364dc5942018d10447dc656b4c21e5 --- /dev/null +++ b/model/model/layers/6/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06660d0496e38cf9f7fddda610ba9a509f222a0686ef47361e76c78e9b69f5f4 +size 1637715 diff --git a/model/model/layers/6/self_attn/o_proj/kernel/0.2 b/model/model/layers/6/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..aaf4095798a094d42117a730512ad98ceb37a59b --- /dev/null +++ b/model/model/layers/6/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b0f913bcef9dd782e499adf088847cda44dbec7cd86b42dc433ecb582bd476e +size 1636198 diff --git a/model/model/layers/6/self_attn/o_proj/kernel/0.3 b/model/model/layers/6/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..958ef34d7a7b5bbf9e5fa0422197c3a5f55e46e8 --- /dev/null +++ b/model/model/layers/6/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:177b8d74c5be0dbecc62da9d652faad22ff7508f4e54cdddc353ab2c8e740ece +size 1636720 diff --git a/model/model/layers/6/self_attn/q_proj/kernel/.zarray b/model/model/layers/6/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..059f1aabbdc9e18d982e2db50174668264fc96e4 --- /dev/null +++ b/model/model/layers/6/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/self_attn/q_proj/kernel/0.0 b/model/model/layers/6/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..4ee2c32b7fb0c4b5076b1c302d272a6eae452619 --- /dev/null +++ 
b/model/model/layers/6/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:049212ee257b6fbfbd562318ccea18f6976f5a057b1bdc024018b8c98d96d5f1 +size 1647174 diff --git a/model/model/layers/6/self_attn/q_proj/kernel/1.0 b/model/model/layers/6/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..afb12c39a053c28392f5fb154294d68674cc3d82 --- /dev/null +++ b/model/model/layers/6/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fcee2c859ccaff9e7ad2076bb232a9efabe783d76a5c0816610a6de38a982e7 +size 1647344 diff --git a/model/model/layers/6/self_attn/q_proj/kernel/2.0 b/model/model/layers/6/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..658824d90064042408747a102d11e440092acc26 --- /dev/null +++ b/model/model/layers/6/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5208bb858536ecfa0320a527249215bf6a88d0e4d217cd834f85ecb0bcd19e0b +size 1647014 diff --git a/model/model/layers/6/self_attn/q_proj/kernel/3.0 b/model/model/layers/6/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..48d19347c13a0b0b6fa441543cc0378d2099bc49 --- /dev/null +++ b/model/model/layers/6/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29b1940caef496fa324398e6d4899ebab439200595beb01f8f94f0bcbcd5363e +size 1647335 diff --git a/model/model/layers/6/self_attn/v_proj/kernel/.zarray b/model/model/layers/6/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/6/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/6/self_attn/v_proj/kernel/0.0 b/model/model/layers/6/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ee8d6552ddce788665a061eb4d90e66a1196c343 --- /dev/null +++ b/model/model/layers/6/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd08ec0ded8f7ae8e43c2599d09bef8c32213a8faa7c488f08819410130a8efb +size 410507 diff --git a/model/model/layers/6/self_attn/v_proj/kernel/1.0 b/model/model/layers/6/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..da7ada1707a2a92a710633aa9712a0f73e1c8d32 --- /dev/null +++ b/model/model/layers/6/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b21aa08b564095faeed3b9448a99f35042c23ffee89760f34a2f494b0e4bdd9b +size 410390 diff --git a/model/model/layers/6/self_attn/v_proj/kernel/2.0 b/model/model/layers/6/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..1a0043f208116779cb613039cb8b49059dc77b93 --- /dev/null +++ b/model/model/layers/6/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e123b79a5b5fa6330135b0fc34f4228132509c933d89f5510c9522e1145aa670 +size 410065 diff --git a/model/model/layers/6/self_attn/v_proj/kernel/3.0 b/model/model/layers/6/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..12bc92d32e84dcb64b3b272a9f637522cfd7fd0d --- /dev/null +++ b/model/model/layers/6/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71da7c73a22f238d334605b1f01e1b72837199e5050414bad0866f3f5003db5c +size 410183 diff --git 
a/model/model/layers/7/input_layernorm/kernel/.zarray b/model/model/layers/7/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/7/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/input_layernorm/kernel/0 b/model/model/layers/7/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..7af8db70b2da30db908ea56ee4f97853a49f0b22 Binary files /dev/null and b/model/model/layers/7/input_layernorm/kernel/0 differ diff --git a/model/model/layers/7/mlp/down_proj/kernel/.zarray b/model/model/layers/7/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..b57b49d09e50779e6e0a2e2d784feed4998dadab --- /dev/null +++ b/model/model/layers/7/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/mlp/down_proj/kernel/0.0 b/model/model/layers/7/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e425b083e36bb1b840eb04e554d378d989c2f8cb --- /dev/null +++ b/model/model/layers/7/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac0464f8ba3d7fa0ffec759f032b4f204d3e9b0afb423d7c3858813efa0bc3f6 +size 6542309 diff --git a/model/model/layers/7/mlp/down_proj/kernel/0.1 b/model/model/layers/7/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..edc2f1d4798ec29dbe8eab66808a50cbe527871d --- /dev/null +++ 
b/model/model/layers/7/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1353fe87e94af1143f3a4635b1b0d7e037cc470eee3b1703f853f6eedef72fdd +size 6542829 diff --git a/model/model/layers/7/mlp/down_proj/kernel/0.2 b/model/model/layers/7/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..dfc8e8f12be9883c5f7de1675dc0c3493a99afaa --- /dev/null +++ b/model/model/layers/7/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e57e3a322e438ad794d192b6dfd3f3672c49c023c3731aa4310ca9f91833914e +size 6538981 diff --git a/model/model/layers/7/mlp/down_proj/kernel/0.3 b/model/model/layers/7/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..19c969979cecb02e262800096c9a19d75209fb57 --- /dev/null +++ b/model/model/layers/7/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3006e5615c7e588a8afd05d88f432c72ca766f28282a4d5e34d964a7c01c1ac9 +size 6541469 diff --git a/model/model/layers/7/mlp/gate_proj/kernel/.zarray b/model/model/layers/7/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/7/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/mlp/gate_proj/kernel/0.0 b/model/model/layers/7/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..eed56440e11924b390cf93c27839fbe217b7c9b2 --- /dev/null +++ b/model/model/layers/7/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:43fe6eb74908578fa7db8529f7420acf8266741cae0d1136812f7b8e2d26c8ee +size 6566239 diff --git a/model/model/layers/7/mlp/gate_proj/kernel/1.0 b/model/model/layers/7/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..50bef3f5ef7b5f798383adaacfa7efe43673389c --- /dev/null +++ b/model/model/layers/7/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:898edd550dff475c8b1ae05c1def54a26c67fe63c31bbf7e9ef3f0934374fcf2 +size 6566683 diff --git a/model/model/layers/7/mlp/gate_proj/kernel/2.0 b/model/model/layers/7/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..77f560864f02a9812f1dc9e1dfcbb9a218504b4e --- /dev/null +++ b/model/model/layers/7/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e179677ee270be337756100e27411315441a386561fbad540f54d4829783ab10 +size 6565637 diff --git a/model/model/layers/7/mlp/gate_proj/kernel/3.0 b/model/model/layers/7/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..2f19bafae9a01bdca462fab1f88855fed8377046 --- /dev/null +++ b/model/model/layers/7/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:703a8a76ec920cee083bb31faac22eeb69d8bd6517905fbcea1c453157e390af +size 6565745 diff --git a/model/model/layers/7/mlp/up_proj/kernel/.zarray b/model/model/layers/7/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/7/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/mlp/up_proj/kernel/0.0 
b/model/model/layers/7/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..4ad6865af0a1c3dcbf1974d9cb090cfc28f3bedc --- /dev/null +++ b/model/model/layers/7/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e43698b5152532a48d941458dccca7b0f2bd822bacc8dfae5c66f65c189efb9 +size 6535560 diff --git a/model/model/layers/7/mlp/up_proj/kernel/1.0 b/model/model/layers/7/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..6694c3c18ef36800b137ec42ef7057d96828aea7 --- /dev/null +++ b/model/model/layers/7/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5825348092ae0734ed710efe1a7498a343483fb019c4a335c9d06c17764b679 +size 6535768 diff --git a/model/model/layers/7/mlp/up_proj/kernel/2.0 b/model/model/layers/7/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..5c840c99b57666ca24e3e320a15f4cb7ea9288eb --- /dev/null +++ b/model/model/layers/7/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d2f11566849d3ab3179d8dc3694bddf4b6db9bba22b4e81345777faa21fbc51 +size 6533742 diff --git a/model/model/layers/7/mlp/up_proj/kernel/3.0 b/model/model/layers/7/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6d1cd4ba5343aba0e6c7eea349cfedeb62b0a473 --- /dev/null +++ b/model/model/layers/7/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c9419998eeaad4e06cdd3b5a29bbbabec02edb8ee69855c7e01b4f10b09180c +size 6533869 diff --git a/model/model/layers/7/post_attention_layernorm/kernel/.zarray b/model/model/layers/7/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/7/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/post_attention_layernorm/kernel/0 b/model/model/layers/7/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..ac9c107fad92684c9b0017f29a1b840e072c6a38 Binary files /dev/null and b/model/model/layers/7/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/7/self_attn/k_proj/kernel/.zarray b/model/model/layers/7/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/7/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/self_attn/k_proj/kernel/0.0 b/model/model/layers/7/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..0bb1d4246354bb4769fcdbd34cefea03a3af8f0b --- /dev/null +++ b/model/model/layers/7/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdd63a5b26e8e5a48e95beb45ef5a3d2ea90b79a04afb87ed1cf7b34368de05b +size 411770 diff --git a/model/model/layers/7/self_attn/k_proj/kernel/1.0 b/model/model/layers/7/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..664e71f40ff429c0381e9ad65d7d845617d59783 --- /dev/null +++ b/model/model/layers/7/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0d0ca70aaf4ad9794b7e9bff1883e802c21416b1d5dd065659826daacc05576 +size 411669 diff --git 
a/model/model/layers/7/self_attn/k_proj/kernel/2.0 b/model/model/layers/7/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..5e75f5d2ef5c30604fc67113d60d2820eabc16d8 --- /dev/null +++ b/model/model/layers/7/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa2ca44ade99317fdc049b5bf0b5d00f7baac539eb0d53eb9bb538e2297a1b38 +size 411803 diff --git a/model/model/layers/7/self_attn/k_proj/kernel/3.0 b/model/model/layers/7/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..2fd60d65fa5cd4f64d179ca1b49cb7eef6f826a1 --- /dev/null +++ b/model/model/layers/7/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a766b4a01e1fe271a03f5c7f28c0139a3c248e2f90d0f6e3a55ed982db2ad070 +size 411506 diff --git a/model/model/layers/7/self_attn/o_proj/kernel/.zarray b/model/model/layers/7/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..1f43215c04ea8738b5721bed11256b14599d4e36 --- /dev/null +++ b/model/model/layers/7/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/self_attn/o_proj/kernel/0.0 b/model/model/layers/7/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8941a9afc2c293832571de9133c07f1e9504b70a --- /dev/null +++ b/model/model/layers/7/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99af536be38d82d7fc135b3df236c6e0a379922efd76ee9dcc98b0b131902deb +size 1638186 diff --git a/model/model/layers/7/self_attn/o_proj/kernel/0.1 b/model/model/layers/7/self_attn/o_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..0e4718a8f3856ef26971b8b84473dc10b022b76a --- /dev/null +++ b/model/model/layers/7/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7b6994c29311b5a4e19b4a272e954288f898d0344059093720f4c49ceb0e226 +size 1638789 diff --git a/model/model/layers/7/self_attn/o_proj/kernel/0.2 b/model/model/layers/7/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..7f189ba669a4ce412a69891fa48690dbfb1ef01d --- /dev/null +++ b/model/model/layers/7/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d9635c45f9fe9a134bfc9c224dbfacf011c09d368163c4496f7e5640c97b840 +size 1637585 diff --git a/model/model/layers/7/self_attn/o_proj/kernel/0.3 b/model/model/layers/7/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..0990f4d8c4e1400c1cb1ae5caf61a83b28614bc9 --- /dev/null +++ b/model/model/layers/7/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7177ea1b5dce3e9138d1051f6990bc75864fc8464929bc67cc973f1ec5df4b2 +size 1637988 diff --git a/model/model/layers/7/self_attn/q_proj/kernel/.zarray b/model/model/layers/7/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..059f1aabbdc9e18d982e2db50174668264fc96e4 --- /dev/null +++ b/model/model/layers/7/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/self_attn/q_proj/kernel/0.0 b/model/model/layers/7/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..81b9280958c1fc19a6daf6bc8de1085eb2131f29 --- /dev/null +++ 
b/model/model/layers/7/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b11ab2644d7832ec37dca4bee3a9fa5cfa28286581dc61d7def7d49e19077f78 +size 1650017 diff --git a/model/model/layers/7/self_attn/q_proj/kernel/1.0 b/model/model/layers/7/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..2e73b9acbea812ad92b265dd1ba1c5d6fba0d840 --- /dev/null +++ b/model/model/layers/7/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:467183cd2dee769c926a3fcbc48c50072ba732558e7b4d3d4f63e77cdc8ec0db +size 1650702 diff --git a/model/model/layers/7/self_attn/q_proj/kernel/2.0 b/model/model/layers/7/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..120856c13aefa8c6260c8c139753dfd5aaad561e --- /dev/null +++ b/model/model/layers/7/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:170dd152745c6e5191946633e3fdc41cbe52db2d06d4b548335e8f85c2974760 +size 1650665 diff --git a/model/model/layers/7/self_attn/q_proj/kernel/3.0 b/model/model/layers/7/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..b89f03c76987b5b293a79681b29c8e7d8ca27ed5 --- /dev/null +++ b/model/model/layers/7/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2a216500a526d9b236efd6f49ae52aabbcdc06218549823268a75586dfe2e39 +size 1650058 diff --git a/model/model/layers/7/self_attn/v_proj/kernel/.zarray b/model/model/layers/7/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/7/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/7/self_attn/v_proj/kernel/0.0 b/model/model/layers/7/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..fc50a50eeea6450b05c0ba6e1aab8ef1e33ec953 --- /dev/null +++ b/model/model/layers/7/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7478463646a187b9276cea047a7b38fac05c1748f6e7e2edc6442b842ef0f698 +size 409566 diff --git a/model/model/layers/7/self_attn/v_proj/kernel/1.0 b/model/model/layers/7/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..15618db34775edbd51765f71485d247235b69871 --- /dev/null +++ b/model/model/layers/7/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6763eebb2c33c6a2e0a2e17ceda0ed899a279b31f46e3a32024b03da7c9eb8fd +size 409372 diff --git a/model/model/layers/7/self_attn/v_proj/kernel/2.0 b/model/model/layers/7/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..9f247e8abd3a0ea4b7697a70a5205e041b30eee7 --- /dev/null +++ b/model/model/layers/7/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcbfe0484c36d6c57031409f0951095212542d21b70d1506977ca773dca253a7 +size 409479 diff --git a/model/model/layers/7/self_attn/v_proj/kernel/3.0 b/model/model/layers/7/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..63246ec5bb1650440b9013b8eec4d49a35ca9cac --- /dev/null +++ b/model/model/layers/7/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcf74281da5b8ecab0bab21102a2e78066d9c2fa57f22484e28088f43ac501c6 +size 409140 diff --git 
a/model/model/layers/8/input_layernorm/kernel/.zarray b/model/model/layers/8/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/8/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/input_layernorm/kernel/0 b/model/model/layers/8/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..950bdeedcad132f2dcd4f477b46828046e3b5862 Binary files /dev/null and b/model/model/layers/8/input_layernorm/kernel/0 differ diff --git a/model/model/layers/8/mlp/down_proj/kernel/.zarray b/model/model/layers/8/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..b57b49d09e50779e6e0a2e2d784feed4998dadab --- /dev/null +++ b/model/model/layers/8/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/mlp/down_proj/kernel/0.0 b/model/model/layers/8/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..5a362eef4137420556572ea73904e746adb4b2d9 --- /dev/null +++ b/model/model/layers/8/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e55d76ac92ffe1f08d12223dc7a709c444d940aa61bea5ea7d64a8d77327e86f +size 6537919 diff --git a/model/model/layers/8/mlp/down_proj/kernel/0.1 b/model/model/layers/8/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..2fffd2712483a8a12ddb77f975ad9d9c7b426ae1 --- /dev/null +++ 
b/model/model/layers/8/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0f5244d8dad035a6329db9ee9baee84ab638d30a414e4db3cec974ad164b7b0 +size 6537716 diff --git a/model/model/layers/8/mlp/down_proj/kernel/0.2 b/model/model/layers/8/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..af7fd1250ed492df972c217a040bef199115cdb6 --- /dev/null +++ b/model/model/layers/8/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71c82310d6ffe534caf90c3bb6cb111db983086219e4c4013e961c41eb21b5f5 +size 6535030 diff --git a/model/model/layers/8/mlp/down_proj/kernel/0.3 b/model/model/layers/8/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..25c740b0348464b7aa8333d577bf6d22a419e23f --- /dev/null +++ b/model/model/layers/8/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a53d189482fcafc398b667001245a58b3abb5a685d60eaf9742043483862d43 +size 6538423 diff --git a/model/model/layers/8/mlp/gate_proj/kernel/.zarray b/model/model/layers/8/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/8/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/mlp/gate_proj/kernel/0.0 b/model/model/layers/8/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..929e21d5364d658e72ded416be7c3047ee0b999d --- /dev/null +++ b/model/model/layers/8/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:fb8267de86434d93fcbf30ee5a64ac98785882893b2c3d846fd1ddcae9846a10 +size 6560618 diff --git a/model/model/layers/8/mlp/gate_proj/kernel/1.0 b/model/model/layers/8/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..087bd8e4862ef9266e60d1fe7736ed3ed0ab0003 --- /dev/null +++ b/model/model/layers/8/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e64d83d70a7e87864cd62ae36d45a6f84468a6ee26f4895611fb38981589582 +size 6561146 diff --git a/model/model/layers/8/mlp/gate_proj/kernel/2.0 b/model/model/layers/8/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..7b04d040b01a5c2b350619b01ef80c4391ffa24e --- /dev/null +++ b/model/model/layers/8/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7c7f331bbfe3e1f1f5a8ce2d05ef3c6dbbb0bde34a2950ec3d3306c0e26bbcb +size 6559367 diff --git a/model/model/layers/8/mlp/gate_proj/kernel/3.0 b/model/model/layers/8/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6e5f42f2c5836dfc3ef956e13824a900037d3835 --- /dev/null +++ b/model/model/layers/8/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d363f22869165034a360b5f1d1c6aa6492d8e62e78c0e4ce0a0876ad1374694 +size 6559908 diff --git a/model/model/layers/8/mlp/up_proj/kernel/.zarray b/model/model/layers/8/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/8/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/mlp/up_proj/kernel/0.0 
b/model/model/layers/8/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..081a18da285ed42695df62324c29d1ddab4403a0 --- /dev/null +++ b/model/model/layers/8/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0c74687be4b6fd52e3a1aebafd262f5c95daeda990ade4f5077da80cbb1baac +size 6540563 diff --git a/model/model/layers/8/mlp/up_proj/kernel/1.0 b/model/model/layers/8/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..7fc75ab2a0f9bbc4b073713c09553ed7560482bf --- /dev/null +++ b/model/model/layers/8/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f63c142f12320400e085004fb38509e3432cf33fdda25f6e6e95b217eb91373 +size 6540558 diff --git a/model/model/layers/8/mlp/up_proj/kernel/2.0 b/model/model/layers/8/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..b86110321e47375486dfba84421c0fca6236a154 --- /dev/null +++ b/model/model/layers/8/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfa7b5ddcca10b4806a972be6a480f332f5fc45e8140f4be35c2216867e84259 +size 6537838 diff --git a/model/model/layers/8/mlp/up_proj/kernel/3.0 b/model/model/layers/8/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..cec151e64fb7175c05b401e000e73a99f019a01e --- /dev/null +++ b/model/model/layers/8/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35b571b027423803e49018e7ff1c93a33d3eca4c9d2b20f01b7dcae014334e17 +size 6538653 diff --git a/model/model/layers/8/post_attention_layernorm/kernel/.zarray b/model/model/layers/8/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/8/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/post_attention_layernorm/kernel/0 b/model/model/layers/8/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..a4e4152434aec64aeb59a338c2436ebb731d0a44 Binary files /dev/null and b/model/model/layers/8/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/8/self_attn/k_proj/kernel/.zarray b/model/model/layers/8/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/8/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/self_attn/k_proj/kernel/0.0 b/model/model/layers/8/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..38459d2214a16c8910f9fb7a6213bf0a3594f72d --- /dev/null +++ b/model/model/layers/8/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbf11f3e02582314d88992aa974e91dba1830d8f7e78b5a4262fbc3058d6f428 +size 411517 diff --git a/model/model/layers/8/self_attn/k_proj/kernel/1.0 b/model/model/layers/8/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..c41cba2b83f7496341725730621d35c7d2380651 --- /dev/null +++ b/model/model/layers/8/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3976919feefa7299053aa7a6c8598ec385ed80bebe9cacc19c2de7776e625ae4 +size 411833 diff --git 
a/model/model/layers/8/self_attn/k_proj/kernel/2.0 b/model/model/layers/8/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..ec35d146835edf05a6929064d007bd1ee775a585 --- /dev/null +++ b/model/model/layers/8/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df7d02801d742dcb2f89be1791773dd5838e868dd5273df8824ae883ef2de798 +size 411669 diff --git a/model/model/layers/8/self_attn/k_proj/kernel/3.0 b/model/model/layers/8/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..d25902989e1c0a5f4937fb3bdd695931558d69a2 --- /dev/null +++ b/model/model/layers/8/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27e5963955f95f61901721e8c7d24285f69572929eecbc0368a6dd1e199ac7af +size 411616 diff --git a/model/model/layers/8/self_attn/o_proj/kernel/.zarray b/model/model/layers/8/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..1f43215c04ea8738b5721bed11256b14599d4e36 --- /dev/null +++ b/model/model/layers/8/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/self_attn/o_proj/kernel/0.0 b/model/model/layers/8/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..b41da27d8c2c3da23846d779a04153d94fddedb5 --- /dev/null +++ b/model/model/layers/8/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a033c7e403bf9e7c02b9269a9ec903efd1701a1b4ec577e0aa1bd7b2f93d15d +size 1638502 diff --git a/model/model/layers/8/self_attn/o_proj/kernel/0.1 b/model/model/layers/8/self_attn/o_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..7fb8db059585233c1664629c79fb13edbb597cb5 --- /dev/null +++ b/model/model/layers/8/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a80c0dd5a31d86f9744b6e58a807bdec0377f723f435d6478dd58b8280049ae +size 1638545 diff --git a/model/model/layers/8/self_attn/o_proj/kernel/0.2 b/model/model/layers/8/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..184b20b3503a125fe8971e660408a3676c20bce2 --- /dev/null +++ b/model/model/layers/8/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88c0fb4beb87c8e192be0f1025f59da7966051afcf585249989bcb54e8b22819 +size 1637490 diff --git a/model/model/layers/8/self_attn/o_proj/kernel/0.3 b/model/model/layers/8/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..d6c29105b90d4ba1699f400c283bb7f57a322885 --- /dev/null +++ b/model/model/layers/8/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf6df5fa535aabf7dba4f7ae6852805645dd3769c64167456e3dd7341b4110b3 +size 1638054 diff --git a/model/model/layers/8/self_attn/q_proj/kernel/.zarray b/model/model/layers/8/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..059f1aabbdc9e18d982e2db50174668264fc96e4 --- /dev/null +++ b/model/model/layers/8/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/self_attn/q_proj/kernel/0.0 b/model/model/layers/8/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8dffdcc34c797983f8be90f66445a5a48a056457 --- /dev/null +++ 
b/model/model/layers/8/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0074060af7583f7f2e19b2639cba0167cd378562ff0f282d02bdcddbdbc81695 +size 1651392 diff --git a/model/model/layers/8/self_attn/q_proj/kernel/1.0 b/model/model/layers/8/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..a953df18134c4b3bb261d76c731e978805dcc767 --- /dev/null +++ b/model/model/layers/8/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cad5953335b7cc0d8e61f3802a9f2ff2b074ad804ff510b9713b84ed7d64d538 +size 1651448 diff --git a/model/model/layers/8/self_attn/q_proj/kernel/2.0 b/model/model/layers/8/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..c07c915e70bf2ec7c657e4753899b87b75889043 --- /dev/null +++ b/model/model/layers/8/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:198d030b21f5df6f970b5eb1ca446eb91ccc196e0684178ae577e5da0d1cc69a +size 1650593 diff --git a/model/model/layers/8/self_attn/q_proj/kernel/3.0 b/model/model/layers/8/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..9123d27e34106fa52da8691dbb1f733c7e0c04ac --- /dev/null +++ b/model/model/layers/8/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53083eca9dabd5e86b7e7a72d7fa7621f9a0fce09b6e16e31098c29cb4801cd3 +size 1650927 diff --git a/model/model/layers/8/self_attn/v_proj/kernel/.zarray b/model/model/layers/8/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/8/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/8/self_attn/v_proj/kernel/0.0 b/model/model/layers/8/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..80f7aee5c35cb907f5f8271bd9b2935d5bb98933 --- /dev/null +++ b/model/model/layers/8/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d77387b85c9ed61e4d185465a05e7000e06f25bb44f29d9407fcef9092191f12 +size 409749 diff --git a/model/model/layers/8/self_attn/v_proj/kernel/1.0 b/model/model/layers/8/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..ade09697eed00a8339d9118480493b7055cdc73c --- /dev/null +++ b/model/model/layers/8/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a721450587828c57a8eacba93e7795ec4005d852fc9f8cc550856c47ef30b532 +size 409730 diff --git a/model/model/layers/8/self_attn/v_proj/kernel/2.0 b/model/model/layers/8/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..d08d2ccd3afa95dcb54a93d0253f98fc829a2e8b --- /dev/null +++ b/model/model/layers/8/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8745b9eefdee0034672b1bfd5c752a97a9830cf77ffcbccda820f192c7c0d874 +size 409609 diff --git a/model/model/layers/8/self_attn/v_proj/kernel/3.0 b/model/model/layers/8/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..340f15a298e61fb1a8bca3710d936cd0dbeec32e --- /dev/null +++ b/model/model/layers/8/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e7f14ada0bd7c9e4f28a9ed53eb6f664eaccf5afe82e7ddce2b7eca703b96b0 +size 409458 diff --git 
a/model/model/layers/9/input_layernorm/kernel/.zarray b/model/model/layers/9/input_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/9/input_layernorm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/input_layernorm/kernel/0 b/model/model/layers/9/input_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..01d10e3b359dded948be7e3760d0394688622be2 Binary files /dev/null and b/model/model/layers/9/input_layernorm/kernel/0 differ diff --git a/model/model/layers/9/mlp/down_proj/kernel/.zarray b/model/model/layers/9/mlp/down_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..b57b49d09e50779e6e0a2e2d784feed4998dadab --- /dev/null +++ b/model/model/layers/9/mlp/down_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[8192,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[8192,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/mlp/down_proj/kernel/0.0 b/model/model/layers/9/mlp/down_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a2b2db0f737f3ceffba59020d91d2d9c57208df4 --- /dev/null +++ b/model/model/layers/9/mlp/down_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dfb077c11f92bbdb1e33cef8f37f1d9d03562bb9837606aa041d91dce3556fc +size 6536370 diff --git a/model/model/layers/9/mlp/down_proj/kernel/0.1 b/model/model/layers/9/mlp/down_proj/kernel/0.1 new file mode 100644 index 0000000000000000000000000000000000000000..ae83b430ec6fed6bf7a69076c658edf396a576f3 --- /dev/null +++ 
b/model/model/layers/9/mlp/down_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dabdcf07c680a1c25630bec4cf5df5813d389525b362e88c36bde1eee12b218 +size 6536839 diff --git a/model/model/layers/9/mlp/down_proj/kernel/0.2 b/model/model/layers/9/mlp/down_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..b0ef0ace4634e6a4fb56b42bca0466b804437558 --- /dev/null +++ b/model/model/layers/9/mlp/down_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3e4be2fe77ba454e6443209106b9576b11f295165b7ecb3bcb94f21b0f5daad +size 6535237 diff --git a/model/model/layers/9/mlp/down_proj/kernel/0.3 b/model/model/layers/9/mlp/down_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..81b9bdc6ccc33a04df5cb1669211cffcd2575351 --- /dev/null +++ b/model/model/layers/9/mlp/down_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:183d0078f0af7401264154efec16378899ac25521276dbb6acba214c892c9dc8 +size 6537978 diff --git a/model/model/layers/9/mlp/gate_proj/kernel/.zarray b/model/model/layers/9/mlp/gate_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/9/mlp/gate_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/mlp/gate_proj/kernel/0.0 b/model/model/layers/9/mlp/gate_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..eefc1f3fdd1c18eebe2eb23b4620c12c73fc36ee --- /dev/null +++ b/model/model/layers/9/mlp/gate_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:2cf8aa4a7ec94a7490e598dd78f6246b13dc4746878b68bf8b700d83fde7fd4b +size 6565178 diff --git a/model/model/layers/9/mlp/gate_proj/kernel/1.0 b/model/model/layers/9/mlp/gate_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..d9d83c56217a2936e2c3fd3d22ef6682e6d0ac5e --- /dev/null +++ b/model/model/layers/9/mlp/gate_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15d7a3c3693452cae975834775ae81f81c91b74b4a8adc5d9cae6cd2f0683080 +size 6566066 diff --git a/model/model/layers/9/mlp/gate_proj/kernel/2.0 b/model/model/layers/9/mlp/gate_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..0f6926119e1f644d2b6bae99fed8054f3935b71d --- /dev/null +++ b/model/model/layers/9/mlp/gate_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99213e7db5e9a0e0761106fdecc533024cca64fce0a05fbbcc090c2eb58a9215 +size 6564814 diff --git a/model/model/layers/9/mlp/gate_proj/kernel/3.0 b/model/model/layers/9/mlp/gate_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..0092b7d682f065dbae790d0c94c19bc5db3550ef --- /dev/null +++ b/model/model/layers/9/mlp/gate_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41b7c235f5028feb6c414ca43380168ea8e94e0e98bca421d45ad4893f257e72 +size 6565601 diff --git a/model/model/layers/9/mlp/up_proj/kernel/.zarray b/model/model/layers/9/mlp/up_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..bfd15e95386293e9aea3e52a5e2e50e7fc8d0d8c --- /dev/null +++ b/model/model/layers/9/mlp/up_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,8192],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,8192],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/mlp/up_proj/kernel/0.0 
b/model/model/layers/9/mlp/up_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..64f83472ee02170a859123cfb75672d156e69348 --- /dev/null +++ b/model/model/layers/9/mlp/up_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:980d1c8492ed898912e163c91982d4e48a3ec44a8e23d032a6c1187812049530 +size 6539311 diff --git a/model/model/layers/9/mlp/up_proj/kernel/1.0 b/model/model/layers/9/mlp/up_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..8119563c842b802d43b26cb59cc09d9b84223c5b --- /dev/null +++ b/model/model/layers/9/mlp/up_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec1045f35f64448f0093a1a50f33cc7d0822a68392b6fa516125ed3d5a837120 +size 6539716 diff --git a/model/model/layers/9/mlp/up_proj/kernel/2.0 b/model/model/layers/9/mlp/up_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..78eec34d6c065a7c091f7498899c381976470350 --- /dev/null +++ b/model/model/layers/9/mlp/up_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78376103b8396d6f3fa403bb026628b46270a62cca9fd185c14fdb7aded85329 +size 6538699 diff --git a/model/model/layers/9/mlp/up_proj/kernel/3.0 b/model/model/layers/9/mlp/up_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..386b824071deea11d2eb0dd54cb75a7a3ba8b698 --- /dev/null +++ b/model/model/layers/9/mlp/up_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c058ead37f3126994bfd539fed511b164b5e5ee79d9f2e4a41570e4be0bcbd94 +size 6539484 diff --git a/model/model/layers/9/post_attention_layernorm/kernel/.zarray b/model/model/layers/9/post_attention_layernorm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/layers/9/post_attention_layernorm/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/post_attention_layernorm/kernel/0 b/model/model/layers/9/post_attention_layernorm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..ac71aa30939c8bf8ceeed4de7ac56e3f9bd9fa0c Binary files /dev/null and b/model/model/layers/9/post_attention_layernorm/kernel/0 differ diff --git a/model/model/layers/9/self_attn/k_proj/kernel/.zarray b/model/model/layers/9/self_attn/k_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/9/self_attn/k_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/self_attn/k_proj/kernel/0.0 b/model/model/layers/9/self_attn/k_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..bee4fe05f9fb8efccd6e459f804d1eea84f84d67 --- /dev/null +++ b/model/model/layers/9/self_attn/k_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac889587d6c447c25a55e57dd57410a610dfb52b1b44d887a36810968911cec7 +size 411004 diff --git a/model/model/layers/9/self_attn/k_proj/kernel/1.0 b/model/model/layers/9/self_attn/k_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..2cb6143cb971c8f23c11248ccb56296bb52e651e --- /dev/null +++ b/model/model/layers/9/self_attn/k_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dcf07956ec82ca362d848fe594ab0d6c7f66752bba66ebcc8e1dc7e7f14083f +size 411136 diff --git 
a/model/model/layers/9/self_attn/k_proj/kernel/2.0 b/model/model/layers/9/self_attn/k_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..cb57ce2be166411b9648bf3bbe42b640d5385a96 --- /dev/null +++ b/model/model/layers/9/self_attn/k_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17c37325f0a817657970977a0175b36ec22ff5a210a2c41e73c1cc538959ff79 +size 411112 diff --git a/model/model/layers/9/self_attn/k_proj/kernel/3.0 b/model/model/layers/9/self_attn/k_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..adfbd5a8e77d979166356bacfdcff07caae3be9e --- /dev/null +++ b/model/model/layers/9/self_attn/k_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bd4449c4c38e60dc5ad72c3cf7571aa05acac91ab1d9263fc461f13e06f5d32 +size 411046 diff --git a/model/model/layers/9/self_attn/o_proj/kernel/.zarray b/model/model/layers/9/self_attn/o_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..1f43215c04ea8738b5721bed11256b14599d4e36 --- /dev/null +++ b/model/model/layers/9/self_attn/o_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/self_attn/o_proj/kernel/0.0 b/model/model/layers/9/self_attn/o_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e54edcb188b36bcfda0e7af418cbd0ff739c9d7f --- /dev/null +++ b/model/model/layers/9/self_attn/o_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf994f3cff4673b8d707edc2b61a2c99b95d879222e97400f426ba72104c8065 +size 1636794 diff --git a/model/model/layers/9/self_attn/o_proj/kernel/0.1 b/model/model/layers/9/self_attn/o_proj/kernel/0.1 new file mode 100644 index 
0000000000000000000000000000000000000000..3541c00e4e164c24e3db3f8d23a428dd24b5cd2e --- /dev/null +++ b/model/model/layers/9/self_attn/o_proj/kernel/0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c46d235a3313e27b19b3f933e6efc99e56d6a64d59ccfd8fd5af605bef367ee +size 1637173 diff --git a/model/model/layers/9/self_attn/o_proj/kernel/0.2 b/model/model/layers/9/self_attn/o_proj/kernel/0.2 new file mode 100644 index 0000000000000000000000000000000000000000..eb94b97be73bc09485b320467d6071e1756d3bff --- /dev/null +++ b/model/model/layers/9/self_attn/o_proj/kernel/0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73bfa2364652d5d265af2e72e35c112973ea88e104ec925aa3abffbe758f9b8e +size 1636559 diff --git a/model/model/layers/9/self_attn/o_proj/kernel/0.3 b/model/model/layers/9/self_attn/o_proj/kernel/0.3 new file mode 100644 index 0000000000000000000000000000000000000000..3e2fb865d4bfb2dca8f104ca4e6f15d1ec7fe98c --- /dev/null +++ b/model/model/layers/9/self_attn/o_proj/kernel/0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f407b55d78dfeef97b1e468c93c87482f9b0dc5cc5745771120f5e86a1c389c7 +size 1636581 diff --git a/model/model/layers/9/self_attn/q_proj/kernel/.zarray b/model/model/layers/9/self_attn/q_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..059f1aabbdc9e18d982e2db50174668264fc96e4 --- /dev/null +++ b/model/model/layers/9/self_attn/q_proj/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[512,2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/self_attn/q_proj/kernel/0.0 b/model/model/layers/9/self_attn/q_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..dbdfd10dd3f4475927384266cb8aab006d118eb6 --- /dev/null +++ 
b/model/model/layers/9/self_attn/q_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86f1e75c600dcf11d8c84cf8d0a8622859548c242a8170e322c8642febd90525 +size 1653575 diff --git a/model/model/layers/9/self_attn/q_proj/kernel/1.0 b/model/model/layers/9/self_attn/q_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..2fc73b828187e8d95cf81fc3727a696c5f1cbbe9 --- /dev/null +++ b/model/model/layers/9/self_attn/q_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4111533f77822c278186424b75a3bcea4b59f021ebae8a15e965e4c10277304 +size 1653427 diff --git a/model/model/layers/9/self_attn/q_proj/kernel/2.0 b/model/model/layers/9/self_attn/q_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..c0ef36b4f094b2d56e37ac20e0dbb621f9d20104 --- /dev/null +++ b/model/model/layers/9/self_attn/q_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0075bd61078b0e26ba026e2a6d33dcd69ed90e6f5aae11e2a9a89ee48739043 +size 1653757 diff --git a/model/model/layers/9/self_attn/q_proj/kernel/3.0 b/model/model/layers/9/self_attn/q_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..64f53f009c0817ce9eb91ffcbd6ff30141936e05 --- /dev/null +++ b/model/model/layers/9/self_attn/q_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:382d979493bc9381ba575f612af6c2f3a2e75eda1cfd189e41a90043ba103597 +size 1653232 diff --git a/model/model/layers/9/self_attn/v_proj/kernel/.zarray b/model/model/layers/9/self_attn/v_proj/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..d18ff84a5a6ba43e3384af11d2124c21f026b970 --- /dev/null +++ b/model/model/layers/9/self_attn/v_proj/kernel/.zarray @@ -0,0 +1 @@ 
+{"chunks":[512,512],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048,512],"zarr_format":2} \ No newline at end of file diff --git a/model/model/layers/9/self_attn/v_proj/kernel/0.0 b/model/model/layers/9/self_attn/v_proj/kernel/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..4b2ba2448575023365feffa85fb348b31b0fed7c --- /dev/null +++ b/model/model/layers/9/self_attn/v_proj/kernel/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76bd9bc58f42ca3aacce82b8ce52f4a8112651b10ef69864e840bce729a8f3e2 +size 409580 diff --git a/model/model/layers/9/self_attn/v_proj/kernel/1.0 b/model/model/layers/9/self_attn/v_proj/kernel/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..c662c0d3148c16447b5587bf5869ee37594a4f40 --- /dev/null +++ b/model/model/layers/9/self_attn/v_proj/kernel/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd3187f1f4438383a35cf1f8705efa249028244e44c4658383e1f26f2559dac9 +size 409458 diff --git a/model/model/layers/9/self_attn/v_proj/kernel/2.0 b/model/model/layers/9/self_attn/v_proj/kernel/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..7228cfb744bfbc0aa24374976758a2500a5a7f84 --- /dev/null +++ b/model/model/layers/9/self_attn/v_proj/kernel/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4e7d330414d572243e7849a06534f85841a3c51e9dfa3a643c4eaeb159c470b +size 409494 diff --git a/model/model/layers/9/self_attn/v_proj/kernel/3.0 b/model/model/layers/9/self_attn/v_proj/kernel/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..12bae5f5716056c333b9cdfff9ecdcd56094a031 --- /dev/null +++ b/model/model/layers/9/self_attn/v_proj/kernel/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9df2901f290ec73cc185705dd6a4728d3ea7497fddfeb7f30a230a8785c08ff +size 409185 diff --git 
a/model/model/norm/kernel/.zarray b/model/model/norm/kernel/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..3d403f2b8224d7972b69bca7c2c483d6b3c57b57 --- /dev/null +++ b/model/model/norm/kernel/.zarray @@ -0,0 +1 @@ +{"chunks":[2048],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"bfloat16","fill_value":null,"filters":null,"order":"C","shape":[2048],"zarr_format":2} \ No newline at end of file diff --git a/model/model/norm/kernel/0 b/model/model/norm/kernel/0 new file mode 100644 index 0000000000000000000000000000000000000000..2c73281241aaea1400983208e6f9c9da61a8215c Binary files /dev/null and b/model/model/norm/kernel/0 differ diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..02ee80b6196926a5ad790a004d9efd6ab1ba6542 --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,16 @@ +{ + "bos_token": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "eos_token": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/tensorstore_index.json b/tensorstore_index.json new file mode 100644 index 0000000000000000000000000000000000000000..49f291751f5497c0c71853653ccd2371efd7a745 --- /dev/null +++ b/tensorstore_index.json @@ -0,0 +1,1143 @@ +{ + "format": "tensorstore", + "version": "easydel", + "prefixes": { + "model": [ + { + "path": "model/model/embed_tokens/embedding", + "shape": [ + 128256, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/0/input_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/0/mlp/down_proj/kernel", + "shape": [ + 8192, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/0/mlp/gate_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": 
"model/model/layers/0/mlp/up_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/0/post_attention_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/0/self_attn/k_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/0/self_attn/o_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/0/self_attn/q_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/0/self_attn/v_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/input_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/mlp/down_proj/kernel", + "shape": [ + 8192, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/mlp/gate_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/mlp/up_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/post_attention_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/self_attn/k_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/self_attn/o_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/self_attn/q_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/1/self_attn/v_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/input_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/mlp/down_proj/kernel", + "shape": [ + 8192, + 2048 + ], + 
"dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/mlp/gate_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/mlp/up_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/post_attention_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/self_attn/k_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/self_attn/o_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/self_attn/q_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/10/self_attn/v_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/input_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/mlp/down_proj/kernel", + "shape": [ + 8192, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/mlp/gate_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/mlp/up_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/post_attention_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/self_attn/k_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/self_attn/o_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/self_attn/q_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/11/self_attn/v_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": 
"model/model/layers/12/input_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/12/mlp/down_proj/kernel", + "shape": [ + 8192, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/12/mlp/gate_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/12/mlp/up_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/12/post_attention_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/12/self_attn/k_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/12/self_attn/o_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/12/self_attn/q_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/12/self_attn/v_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/input_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/mlp/down_proj/kernel", + "shape": [ + 8192, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/mlp/gate_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/mlp/up_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/post_attention_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/self_attn/k_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/self_attn/o_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/self_attn/q_proj/kernel", + "shape": [ + 2048, + 
2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/13/self_attn/v_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/input_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/mlp/down_proj/kernel", + "shape": [ + 8192, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/mlp/gate_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/mlp/up_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/post_attention_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/self_attn/k_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/self_attn/o_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/self_attn/q_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/14/self_attn/v_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/15/input_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/15/mlp/down_proj/kernel", + "shape": [ + 8192, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/15/mlp/gate_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/15/mlp/up_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/15/post_attention_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/15/self_attn/k_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": 
"model/model/layers/15/self_attn/o_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/15/self_attn/q_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/15/self_attn/v_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/input_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/mlp/down_proj/kernel", + "shape": [ + 8192, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/mlp/gate_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/mlp/up_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/post_attention_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/self_attn/k_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/self_attn/o_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/self_attn/q_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/2/self_attn/v_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/input_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/mlp/down_proj/kernel", + "shape": [ + 8192, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/mlp/gate_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/mlp/up_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/post_attention_layernorm/kernel", + "shape": [ + 2048 + ], + 
"dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/self_attn/k_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/self_attn/o_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/self_attn/q_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/3/self_attn/v_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/4/input_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/4/mlp/down_proj/kernel", + "shape": [ + 8192, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/4/mlp/gate_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/4/mlp/up_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/4/post_attention_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/4/self_attn/k_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/4/self_attn/o_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/4/self_attn/q_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/4/self_attn/v_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/input_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/mlp/down_proj/kernel", + "shape": [ + 8192, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/mlp/gate_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/mlp/up_proj/kernel", + 
"shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/post_attention_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/self_attn/k_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/self_attn/o_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/self_attn/q_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/5/self_attn/v_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/input_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/mlp/down_proj/kernel", + "shape": [ + 8192, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/mlp/gate_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/mlp/up_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/post_attention_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/self_attn/k_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/self_attn/o_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/self_attn/q_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/6/self_attn/v_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/7/input_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/7/mlp/down_proj/kernel", + "shape": [ + 8192, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": 
"model/model/layers/7/mlp/gate_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/7/mlp/up_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/7/post_attention_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/7/self_attn/k_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/7/self_attn/o_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/7/self_attn/q_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/7/self_attn/v_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/8/input_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/8/mlp/down_proj/kernel", + "shape": [ + 8192, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/8/mlp/gate_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/8/mlp/up_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/8/post_attention_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/8/self_attn/k_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/8/self_attn/o_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/8/self_attn/q_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/8/self_attn/v_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/input_layernorm/kernel", + "shape": [ + 2048 + ], + 
"dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/mlp/down_proj/kernel", + "shape": [ + 8192, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/mlp/gate_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/mlp/up_proj/kernel", + "shape": [ + 2048, + 8192 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/post_attention_layernorm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/self_attn/k_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/self_attn/o_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/self_attn/q_proj/kernel", + "shape": [ + 2048, + 2048 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/layers/9/self_attn/v_proj/kernel", + "shape": [ + 2048, + 512 + ], + "dtype": "bfloat16" + }, + { + "path": "model/model/norm/kernel", + "shape": [ + 2048 + ], + "dtype": "bfloat16" + } + ] + } +} \ No newline at end of file diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1c1d8d5c9024994f1d3b00f9662b8dd89ca13cf2 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9e4e7fb171f92fd137b777cc2714bf87d11576700a1dcd7a399e7bbe39537b +size 17209920 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..8b0c7c141373ca36e5e819a28f60e146ccef652f --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,2062 @@ +{ + "added_tokens_decoder": { + "128000": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128001": { + "content": "<|end_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + 
"single_word": false, + "special": true + }, + "128002": { + "content": "<|reserved_special_token_0|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128003": { + "content": "<|reserved_special_token_1|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128004": { + "content": "<|finetune_right_pad_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128005": { + "content": "<|reserved_special_token_2|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128006": { + "content": "<|start_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128007": { + "content": "<|end_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128008": { + "content": "<|eom_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128009": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128010": { + "content": "<|python_tag|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128011": { + "content": "<|reserved_special_token_3|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128012": { + "content": "<|reserved_special_token_4|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128013": { + "content": "<|reserved_special_token_5|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128014": { + 
"content": "<|reserved_special_token_6|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128015": { + "content": "<|reserved_special_token_7|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128016": { + "content": "<|reserved_special_token_8|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128017": { + "content": "<|reserved_special_token_9|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128018": { + "content": "<|reserved_special_token_10|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128019": { + "content": "<|reserved_special_token_11|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128020": { + "content": "<|reserved_special_token_12|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128021": { + "content": "<|reserved_special_token_13|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128022": { + "content": "<|reserved_special_token_14|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128023": { + "content": "<|reserved_special_token_15|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128024": { + "content": "<|reserved_special_token_16|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128025": { + "content": "<|reserved_special_token_17|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + 
"128026": { + "content": "<|reserved_special_token_18|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128027": { + "content": "<|reserved_special_token_19|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128028": { + "content": "<|reserved_special_token_20|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128029": { + "content": "<|reserved_special_token_21|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128030": { + "content": "<|reserved_special_token_22|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128031": { + "content": "<|reserved_special_token_23|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128032": { + "content": "<|reserved_special_token_24|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128033": { + "content": "<|reserved_special_token_25|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128034": { + "content": "<|reserved_special_token_26|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128035": { + "content": "<|reserved_special_token_27|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128036": { + "content": "<|reserved_special_token_28|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128037": { + "content": "<|reserved_special_token_29|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + 
"special": true + }, + "128038": { + "content": "<|reserved_special_token_30|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128039": { + "content": "<|reserved_special_token_31|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128040": { + "content": "<|reserved_special_token_32|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128041": { + "content": "<|reserved_special_token_33|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128042": { + "content": "<|reserved_special_token_34|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128043": { + "content": "<|reserved_special_token_35|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128044": { + "content": "<|reserved_special_token_36|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128045": { + "content": "<|reserved_special_token_37|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128046": { + "content": "<|reserved_special_token_38|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128047": { + "content": "<|reserved_special_token_39|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128048": { + "content": "<|reserved_special_token_40|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128049": { + "content": "<|reserved_special_token_41|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + 
"single_word": false, + "special": true + }, + "128050": { + "content": "<|reserved_special_token_42|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128051": { + "content": "<|reserved_special_token_43|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128052": { + "content": "<|reserved_special_token_44|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128053": { + "content": "<|reserved_special_token_45|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128054": { + "content": "<|reserved_special_token_46|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128055": { + "content": "<|reserved_special_token_47|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128056": { + "content": "<|reserved_special_token_48|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128057": { + "content": "<|reserved_special_token_49|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128058": { + "content": "<|reserved_special_token_50|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128059": { + "content": "<|reserved_special_token_51|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128060": { + "content": "<|reserved_special_token_52|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128061": { + "content": "<|reserved_special_token_53|>", + "lstrip": false, + "normalized": false, + 
"rstrip": false, + "single_word": false, + "special": true + }, + "128062": { + "content": "<|reserved_special_token_54|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128063": { + "content": "<|reserved_special_token_55|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128064": { + "content": "<|reserved_special_token_56|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128065": { + "content": "<|reserved_special_token_57|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128066": { + "content": "<|reserved_special_token_58|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128067": { + "content": "<|reserved_special_token_59|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128068": { + "content": "<|reserved_special_token_60|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128069": { + "content": "<|reserved_special_token_61|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128070": { + "content": "<|reserved_special_token_62|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128071": { + "content": "<|reserved_special_token_63|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128072": { + "content": "<|reserved_special_token_64|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128073": { + "content": "<|reserved_special_token_65|>", + "lstrip": false, + 
"normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128074": { + "content": "<|reserved_special_token_66|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128075": { + "content": "<|reserved_special_token_67|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128076": { + "content": "<|reserved_special_token_68|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128077": { + "content": "<|reserved_special_token_69|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128078": { + "content": "<|reserved_special_token_70|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128079": { + "content": "<|reserved_special_token_71|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128080": { + "content": "<|reserved_special_token_72|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128081": { + "content": "<|reserved_special_token_73|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128082": { + "content": "<|reserved_special_token_74|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128083": { + "content": "<|reserved_special_token_75|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128084": { + "content": "<|reserved_special_token_76|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128085": { + "content": "<|reserved_special_token_77|>", + 
"lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128086": { + "content": "<|reserved_special_token_78|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128087": { + "content": "<|reserved_special_token_79|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128088": { + "content": "<|reserved_special_token_80|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128089": { + "content": "<|reserved_special_token_81|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128090": { + "content": "<|reserved_special_token_82|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128091": { + "content": "<|reserved_special_token_83|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128092": { + "content": "<|reserved_special_token_84|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128093": { + "content": "<|reserved_special_token_85|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128094": { + "content": "<|reserved_special_token_86|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128095": { + "content": "<|reserved_special_token_87|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128096": { + "content": "<|reserved_special_token_88|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128097": { + "content": 
"<|reserved_special_token_89|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128098": { + "content": "<|reserved_special_token_90|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128099": { + "content": "<|reserved_special_token_91|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128100": { + "content": "<|reserved_special_token_92|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128101": { + "content": "<|reserved_special_token_93|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128102": { + "content": "<|reserved_special_token_94|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128103": { + "content": "<|reserved_special_token_95|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128104": { + "content": "<|reserved_special_token_96|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128105": { + "content": "<|reserved_special_token_97|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128106": { + "content": "<|reserved_special_token_98|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128107": { + "content": "<|reserved_special_token_99|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128108": { + "content": "<|reserved_special_token_100|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + 
"128109": { + "content": "<|reserved_special_token_101|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128110": { + "content": "<|reserved_special_token_102|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128111": { + "content": "<|reserved_special_token_103|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128112": { + "content": "<|reserved_special_token_104|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128113": { + "content": "<|reserved_special_token_105|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128114": { + "content": "<|reserved_special_token_106|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128115": { + "content": "<|reserved_special_token_107|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128116": { + "content": "<|reserved_special_token_108|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128117": { + "content": "<|reserved_special_token_109|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128118": { + "content": "<|reserved_special_token_110|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128119": { + "content": "<|reserved_special_token_111|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128120": { + "content": "<|reserved_special_token_112|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": 
false, + "special": true + }, + "128121": { + "content": "<|reserved_special_token_113|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128122": { + "content": "<|reserved_special_token_114|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128123": { + "content": "<|reserved_special_token_115|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128124": { + "content": "<|reserved_special_token_116|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128125": { + "content": "<|reserved_special_token_117|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128126": { + "content": "<|reserved_special_token_118|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128127": { + "content": "<|reserved_special_token_119|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128128": { + "content": "<|reserved_special_token_120|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128129": { + "content": "<|reserved_special_token_121|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128130": { + "content": "<|reserved_special_token_122|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128131": { + "content": "<|reserved_special_token_123|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128132": { + "content": "<|reserved_special_token_124|>", + "lstrip": false, + "normalized": false, + 
"rstrip": false, + "single_word": false, + "special": true + }, + "128133": { + "content": "<|reserved_special_token_125|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128134": { + "content": "<|reserved_special_token_126|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128135": { + "content": "<|reserved_special_token_127|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128136": { + "content": "<|reserved_special_token_128|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128137": { + "content": "<|reserved_special_token_129|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128138": { + "content": "<|reserved_special_token_130|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128139": { + "content": "<|reserved_special_token_131|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128140": { + "content": "<|reserved_special_token_132|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128141": { + "content": "<|reserved_special_token_133|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128142": { + "content": "<|reserved_special_token_134|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128143": { + "content": "<|reserved_special_token_135|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128144": { + "content": "<|reserved_special_token_136|>", + "lstrip": 
false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128145": { + "content": "<|reserved_special_token_137|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128146": { + "content": "<|reserved_special_token_138|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128147": { + "content": "<|reserved_special_token_139|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128148": { + "content": "<|reserved_special_token_140|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128149": { + "content": "<|reserved_special_token_141|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128150": { + "content": "<|reserved_special_token_142|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128151": { + "content": "<|reserved_special_token_143|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128152": { + "content": "<|reserved_special_token_144|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128153": { + "content": "<|reserved_special_token_145|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128154": { + "content": "<|reserved_special_token_146|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128155": { + "content": "<|reserved_special_token_147|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128156": { + "content": 
"<|reserved_special_token_148|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128157": { + "content": "<|reserved_special_token_149|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128158": { + "content": "<|reserved_special_token_150|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128159": { + "content": "<|reserved_special_token_151|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128160": { + "content": "<|reserved_special_token_152|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128161": { + "content": "<|reserved_special_token_153|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128162": { + "content": "<|reserved_special_token_154|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128163": { + "content": "<|reserved_special_token_155|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128164": { + "content": "<|reserved_special_token_156|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128165": { + "content": "<|reserved_special_token_157|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128166": { + "content": "<|reserved_special_token_158|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128167": { + "content": "<|reserved_special_token_159|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + 
}, + "128168": { + "content": "<|reserved_special_token_160|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128169": { + "content": "<|reserved_special_token_161|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128170": { + "content": "<|reserved_special_token_162|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128171": { + "content": "<|reserved_special_token_163|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128172": { + "content": "<|reserved_special_token_164|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128173": { + "content": "<|reserved_special_token_165|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128174": { + "content": "<|reserved_special_token_166|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128175": { + "content": "<|reserved_special_token_167|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128176": { + "content": "<|reserved_special_token_168|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128177": { + "content": "<|reserved_special_token_169|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128178": { + "content": "<|reserved_special_token_170|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128179": { + "content": "<|reserved_special_token_171|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + 
"single_word": false, + "special": true + }, + "128180": { + "content": "<|reserved_special_token_172|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128181": { + "content": "<|reserved_special_token_173|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128182": { + "content": "<|reserved_special_token_174|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128183": { + "content": "<|reserved_special_token_175|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128184": { + "content": "<|reserved_special_token_176|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128185": { + "content": "<|reserved_special_token_177|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128186": { + "content": "<|reserved_special_token_178|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128187": { + "content": "<|reserved_special_token_179|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128188": { + "content": "<|reserved_special_token_180|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128189": { + "content": "<|reserved_special_token_181|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128190": { + "content": "<|reserved_special_token_182|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128191": { + "content": "<|reserved_special_token_183|>", + "lstrip": false, + "normalized": 
false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128192": { + "content": "<|reserved_special_token_184|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128193": { + "content": "<|reserved_special_token_185|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128194": { + "content": "<|reserved_special_token_186|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128195": { + "content": "<|reserved_special_token_187|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128196": { + "content": "<|reserved_special_token_188|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128197": { + "content": "<|reserved_special_token_189|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128198": { + "content": "<|reserved_special_token_190|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128199": { + "content": "<|reserved_special_token_191|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128200": { + "content": "<|reserved_special_token_192|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128201": { + "content": "<|reserved_special_token_193|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128202": { + "content": "<|reserved_special_token_194|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128203": { + "content": "<|reserved_special_token_195|>", + 
"lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128204": { + "content": "<|reserved_special_token_196|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128205": { + "content": "<|reserved_special_token_197|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128206": { + "content": "<|reserved_special_token_198|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128207": { + "content": "<|reserved_special_token_199|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128208": { + "content": "<|reserved_special_token_200|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128209": { + "content": "<|reserved_special_token_201|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128210": { + "content": "<|reserved_special_token_202|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128211": { + "content": "<|reserved_special_token_203|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128212": { + "content": "<|reserved_special_token_204|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128213": { + "content": "<|reserved_special_token_205|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128214": { + "content": "<|reserved_special_token_206|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128215": { + "content": 
"<|reserved_special_token_207|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128216": { + "content": "<|reserved_special_token_208|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128217": { + "content": "<|reserved_special_token_209|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128218": { + "content": "<|reserved_special_token_210|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128219": { + "content": "<|reserved_special_token_211|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128220": { + "content": "<|reserved_special_token_212|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128221": { + "content": "<|reserved_special_token_213|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128222": { + "content": "<|reserved_special_token_214|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128223": { + "content": "<|reserved_special_token_215|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128224": { + "content": "<|reserved_special_token_216|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128225": { + "content": "<|reserved_special_token_217|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128226": { + "content": "<|reserved_special_token_218|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + 
}, + "128227": { + "content": "<|reserved_special_token_219|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128228": { + "content": "<|reserved_special_token_220|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128229": { + "content": "<|reserved_special_token_221|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128230": { + "content": "<|reserved_special_token_222|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128231": { + "content": "<|reserved_special_token_223|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128232": { + "content": "<|reserved_special_token_224|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128233": { + "content": "<|reserved_special_token_225|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128234": { + "content": "<|reserved_special_token_226|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128235": { + "content": "<|reserved_special_token_227|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128236": { + "content": "<|reserved_special_token_228|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128237": { + "content": "<|reserved_special_token_229|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128238": { + "content": "<|reserved_special_token_230|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + 
"single_word": false, + "special": true + }, + "128239": { + "content": "<|reserved_special_token_231|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128240": { + "content": "<|reserved_special_token_232|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128241": { + "content": "<|reserved_special_token_233|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128242": { + "content": "<|reserved_special_token_234|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128243": { + "content": "<|reserved_special_token_235|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128244": { + "content": "<|reserved_special_token_236|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128245": { + "content": "<|reserved_special_token_237|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128246": { + "content": "<|reserved_special_token_238|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128247": { + "content": "<|reserved_special_token_239|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128248": { + "content": "<|reserved_special_token_240|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128249": { + "content": "<|reserved_special_token_241|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128250": { + "content": "<|reserved_special_token_242|>", + "lstrip": false, + "normalized": 
false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128251": { + "content": "<|reserved_special_token_243|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128252": { + "content": "<|reserved_special_token_244|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128253": { + "content": "<|reserved_special_token_245|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128254": { + "content": "<|reserved_special_token_246|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128255": { + "content": "<|reserved_special_token_247|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + } + }, + "bos_token": "<|begin_of_text|>", + "clean_up_tokenization_spaces": true, + "eos_token": "<|eot_id|>", + "extra_special_tokens": {}, + "model_input_names": [ + "input_ids", + "attention_mask" + ], + "model_max_length": 131072, + "tokenizer_class": "PreTrainedTokenizerFast" +}