diff --git a/1b_layer0_mlp.down_proj_output_pretrain_representation.pth b/1b_layer0_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..57118afb4f0167820d8d392df3c351518e9ca1e8 --- /dev/null +++ b/1b_layer0_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4956bfc3dd16fb349d56ce9a47572dc1b873cdfe731cccb36e9dc6b17948f83 +size 66700871 diff --git a/1b_layer0_mlp.gate_proj_input_pretrain_representation.pth b/1b_layer0_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..47f2f4538bbbc94123acd3136f1a7e8e11d161fd --- /dev/null +++ b/1b_layer0_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8b9d45e7b26bc101d25f0f4a268c26a7d5a10e3a2466c949fc3e3220403a7b4 +size 66700802 diff --git a/1b_layer0_mlp.up_proj_input_pretrain_representation.pth b/1b_layer0_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..bb294106f0a1ddceed4ea52f3a3345b64639d168 --- /dev/null +++ b/1b_layer0_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b76dfb856e4e6ee83c25d98f976bd3057baf8781a8b0fc08e6e88a4f5973833d +size 66700792 diff --git a/1b_layer0_self_attn.k_proj_input_pretrain_representation.pth b/1b_layer0_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..3d25e00212382c639bc40bb3d92119e87dec9180 --- /dev/null +++ b/1b_layer0_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e217355e366ee4240af1b67c661b7f8f8e25e9738c9bb6c55b2e6b0c97ad739 +size 66700881 diff --git a/1b_layer0_self_attn.k_proj_output_pretrain_representation.pth b/1b_layer0_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..75a515d1de3e4d6744c74d938af7c2a56ef26f01 --- /dev/null +++ b/1b_layer0_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9c2d03216822319ca1aeb19b84d2f3b7cfc8b87233461ade3fae5244ffc15b7 +size 16676438 diff --git a/1b_layer0_self_attn.o_proj_output_pretrain_representation.pth b/1b_layer0_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..73719d93654850b29787ca4b8df9bd5d663035d2 --- /dev/null +++ b/1b_layer0_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cdf401fee81f6c648db08b58fec668f8648c32bd871cc6d3747b4ca648af2a6 +size 66700886 diff --git a/1b_layer0_self_attn.v_proj_input_pretrain_representation.pth b/1b_layer0_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ee413731e80156f18330b01ccda4394482257366 --- /dev/null +++ b/1b_layer0_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3195544c6b4e3ee81648c2bb84b6767741ff3cfb79aaf5307cdda3076e562f1c +size 66700881 diff --git a/1b_layer0_self_attn.v_proj_output_pretrain_representation.pth b/1b_layer0_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..94d285c06de3d94ba0a8b32cc9afcafbafea3901 --- /dev/null +++ b/1b_layer0_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21bba22a84bd1d4978a833442bdb828cc8aeeda39bccfa1ed49e168d3ac8610a +size 16676438 diff --git a/1b_layer10_mlp.down_proj_output_pretrain_representation.pth b/1b_layer10_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..746089e7890e2f0858ba6715475408a6c410c62a --- /dev/null +++ b/1b_layer10_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91675b45b0a0dacc1c0d26258cbafeedfc644d3ef7ed606b7aeb9cc20f9600fe +size 66700876 diff --git a/1b_layer10_mlp.gate_proj_input_pretrain_representation.pth b/1b_layer10_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a95dce90187f36fc487b5692525879696825eddd --- /dev/null +++ b/1b_layer10_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebcc7635e70a61557dc4044f961ae3d0ae2241dfa75010afd0db00ae19794bf1 +size 66700871 diff --git a/1b_layer10_mlp.up_proj_input_pretrain_representation.pth b/1b_layer10_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f630d0b39b7b07f2594505a43c4ac82a0643f1e2 --- /dev/null +++ b/1b_layer10_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbb0ca57f8943393552262f9b633f3707d2ad25a1a663f9a2273bd6f453c944e +size 66700797 diff --git a/1b_layer10_self_attn.k_proj_input_pretrain_representation.pth b/1b_layer10_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e4c6bd56b956577b86cda670163c831b2e4435e0 --- /dev/null +++ b/1b_layer10_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f160be22732d812b9fe5c9be6b83b10a9999cc81a82a29193fad09300be9f153 +size 66700886 diff --git a/1b_layer10_self_attn.k_proj_output_pretrain_representation.pth b/1b_layer10_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4a031946fa57825fafc501fa6cddd0b82dbb8761 --- /dev/null +++ b/1b_layer10_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4ef244a89906e2ccb5e0e42bdcb6ff6b6143eb5e75f16234ab244394b0b7cc8 +size 16676443 diff --git a/1b_layer10_self_attn.o_proj_output_pretrain_representation.pth b/1b_layer10_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..677c1a25be6ba88372c24306ca72e323019d96d1 --- /dev/null +++ b/1b_layer10_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:618e336f049c6131862d61607ee88935defa2a4bec51e992ef26b64f08842765 +size 66700891 diff --git a/1b_layer10_self_attn.q_proj_input_pretrain_representation.pth b/1b_layer10_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..464abc3091c758d3245ff7c10bf242a3f04122e6 --- /dev/null +++ b/1b_layer10_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcc63f8fecb0a3a8e966b625529ff08c03dbe82a37f7e828f236fd0c943b7181 +size 66700886 diff --git a/1b_layer10_self_attn.v_proj_input_pretrain_representation.pth b/1b_layer10_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7e40ccbd1a7b085568c35e2bf7c6cd4e7e87652c --- /dev/null +++ b/1b_layer10_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6dde16c9302c5f55a1b8591180c8cf6b6fa41e6ae5828037347f303b8975093 +size 66700886 diff --git a/1b_layer11_mlp.gate_proj_input_pretrain_representation.pth b/1b_layer11_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..849d242cc552b769532303374491aa8bb2d65460 --- /dev/null +++ b/1b_layer11_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1a449273804c779d389415061cb26c29e2a9dfc5d97e13ba66759f7953e50a5 +size 66700871 diff --git a/1b_layer11_mlp.up_proj_input_pretrain_representation.pth b/1b_layer11_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a7137aec64d94762b0cdeca30e25790e641ee6ed --- /dev/null +++ b/1b_layer11_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd9a9e9d945f6108913dc0242fcb96e47fb5594bb1e120b794c46a253cb3ee9e +size 66700797 diff --git a/1b_layer11_self_attn.k_proj_input_pretrain_representation.pth b/1b_layer11_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f27597a1b007fd2512b7e72fe14b44650b9d1f46 --- /dev/null +++ b/1b_layer11_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:295af11e4c764bd10cab052b25aca2f2c22efff12700a8d909f50588a4336f39 +size 66700886 diff --git a/1b_layer11_self_attn.o_proj_input_pretrain_representation.pth b/1b_layer11_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e7c4fde771209225d8c88e7ad5837bafc8bc492b --- /dev/null +++ b/1b_layer11_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e11d37f51c82e6ed7466674dbba5ef8e8588b9d56cd038069fe6b9c4009a42f +size 66700886 diff --git a/1b_layer11_self_attn.v_proj_output_pretrain_representation.pth b/1b_layer11_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..32e0bc2b4b92f8e1434051d80b90cc9209734dc0 --- /dev/null +++ b/1b_layer11_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:420de39b3ffa6b45738c15ee4d90901139955f4791461878e1d346f4a207607a +size 16676443 diff --git a/1b_layer12_mlp.down_proj_output_pretrain_representation.pth b/1b_layer12_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..317528d49b3413dd44ad7c67167833bcf5a6cd60 --- /dev/null +++ b/1b_layer12_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c630c0f91aa2332a90e4ef0475a58f413410dfef4f285cd2b8ae8bf7e9d716ec +size 66700876 diff --git a/1b_layer12_mlp.up_proj_input_pretrain_representation.pth b/1b_layer12_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..cb68b3cb619e3095e98b14560359a322c0724825 --- /dev/null +++ b/1b_layer12_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ddf41e4b97924bdf2268085646ce6910f5b20c43391bcece19aaaa8d73c0168 +size 66700797 diff --git a/1b_layer12_self_attn.o_proj_input_pretrain_representation.pth b/1b_layer12_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..526750c10726240b95532a6ec6b05a770d1245c1 --- /dev/null +++ b/1b_layer12_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4bdd010ecd7698ee42110a78ac2017de46e5a6a0d8a3b510fd12d77e16fbe8b +size 66700886 diff --git a/1b_layer12_self_attn.q_proj_input_pretrain_representation.pth b/1b_layer12_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ce87c9fdd4270082dbfbc74b670746bf0f4f7590 --- /dev/null +++ b/1b_layer12_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39d86d9ef25ca91fe4e6fc960fc4fb04d554667a69e3a3783a08d07e85d89eeb +size 66700886 diff --git a/1b_layer12_self_attn.v_proj_input_pretrain_representation.pth b/1b_layer12_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e571382cfd3ff8af53c691450932b4c74c6ba7af --- /dev/null +++ b/1b_layer12_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfbce488f47f03cdcca7bd2b713e371a7b20fc2f837f629fceb6b9a4b72a0bb8 +size 66700886 diff --git a/1b_layer12_self_attn.v_proj_output_pretrain_representation.pth b/1b_layer12_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f965456f41889bdf5941cc83c36816f2a4313f6a --- /dev/null +++ b/1b_layer12_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:733e773d18ad7b290467d3a28190ac981be12ede17f8fd8f3050580e71acda65 +size 16676443 diff --git a/1b_layer13_self_attn.q_proj_input_pretrain_representation.pth b/1b_layer13_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a4df0039706956ac23017472c3747a44ad6a4cfe --- /dev/null +++ b/1b_layer13_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5995460b74bda353c5b065d296c6bbf2190d33a3a1c98aa6e03bad8feb4e521 +size 66700886 diff --git a/1b_layer13_self_attn.q_proj_output_pretrain_representation.pth b/1b_layer13_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..144b58aa3847638c1eee289838b3c86b44406187 --- /dev/null +++ b/1b_layer13_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e635f35547b3eed65bcdc8f3fe35f94139ed309825d84105f70a135c03320083 +size 66700891 diff --git a/1b_layer13_self_attn.v_proj_input_pretrain_representation.pth b/1b_layer13_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..cf7524089ce6ff49874691cc20cd5b724bb8166b --- /dev/null +++ b/1b_layer13_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:629be50af0295ff5d40a69d8a160ff2aa4b72b8c4fe19659f435c577feb3a44e +size 66700886 diff --git a/1b_layer13_self_attn.v_proj_output_pretrain_representation.pth b/1b_layer13_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..99fe99ff5a881b5acc1a6883201446b45c143629 --- /dev/null +++ b/1b_layer13_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7b5b61036d1dc01b9ccad708a6789597b4483ede43d1e50c6d2dd0f92aee6ce +size 16676443 diff --git a/1b_layer14_self_attn.k_proj_output_pretrain_representation.pth b/1b_layer14_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..763a50c293aa808c509594e2e0c6a1d59de20e02 --- /dev/null +++ b/1b_layer14_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f36fc4a0ab303136602b57318057a6a568da6dd8c661fe4b4b663e46ffe9ed4 +size 16676443 diff --git a/1b_layer14_self_attn.q_proj_input_pretrain_representation.pth b/1b_layer14_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4de557230a13863658a5469881478794f3c3395e --- /dev/null +++ b/1b_layer14_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:463966623efc74df386a0fd2669f41eb50d85c50a1fd6f8fba39e557a2abf68e +size 66700886 diff --git a/1b_layer14_self_attn.v_proj_output_pretrain_representation.pth b/1b_layer14_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c68e701a55aba9f8a432bcaf860e6b21038f835d --- /dev/null +++ b/1b_layer14_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05d68dab57a7e18bf5e1693e5a18ed1d02468ba4eaadb0014d640e38e2ede864 +size 16676443 diff --git a/1b_layer15_mlp.gate_proj_input_pretrain_representation.pth b/1b_layer15_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..3e46ec99732595bd11e51686764a8c816ed29fb4 --- /dev/null +++ b/1b_layer15_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bce9fd80bdd484d4bc56207f17204b175e44bcaaeab17b0dde70d90d726842c +size 66700871 diff --git a/1b_layer15_self_attn.k_proj_input_pretrain_representation.pth b/1b_layer15_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..020360efc9ba49387d58d8794048c30e9b5a39c7 --- /dev/null +++ b/1b_layer15_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd11458dfd4b64462307e4d320d17783716eb665f554a64090b9b75d6a06256c +size 66700886 diff --git a/1b_layer15_self_attn.k_proj_output_pretrain_representation.pth b/1b_layer15_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..38612bb9f2a64fd1c80f278a7cf6a12b43c26d52 --- /dev/null +++ b/1b_layer15_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bc6767dde30c8896b5fe0f384310f87ff6d594ffe6a1b0e02511391e42d1230 +size 16676443 diff --git a/1b_layer15_self_attn.o_proj_input_pretrain_representation.pth b/1b_layer15_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7fa9592385c8a9f04077c099fa2d580c7af0b049 --- /dev/null +++ b/1b_layer15_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4dd8435854ca43e561971fb76bfa29c24eca7936c956528201f6a46f3751065 +size 66700886 diff --git a/1b_layer15_self_attn.o_proj_output_pretrain_representation.pth b/1b_layer15_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f2b7dfef9909692c4534f33f7795d0a812c7398f --- /dev/null +++ b/1b_layer15_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a285fde85618550e8732d42ac7fdc08073f9b347f4e33661ba96e49bd2adcca9 +size 66700891 diff --git a/1b_layer15_self_attn.v_proj_input_pretrain_representation.pth b/1b_layer15_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f1526f21861eb281a88800fa85078ae6c9381a21 --- /dev/null +++ b/1b_layer15_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2b39592f2fbe474fa57c381e9d91578eb1229fe99263b3963c2e5738f5f0485 +size 66700886 diff --git a/1b_layer15_self_attn.v_proj_output_pretrain_representation.pth b/1b_layer15_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..de28fd03266aa0b7eaf64940b48d08eb1220ef42 --- /dev/null +++ b/1b_layer15_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8693a061852decf05e76d3980e4c32c1e8d7c85b5b9131564470fe0af8b75520 +size 16676443 diff --git a/1b_layer1_mlp.gate_proj_input_pretrain_representation.pth b/1b_layer1_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f11c0bd4834b21a1c511e188188893cf0a0b07a6 --- /dev/null +++ b/1b_layer1_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26c5d73e268ca59ade0c77bfa60e550d18f918fabe1c7457ff5372a5130f877a +size 66700802 diff --git a/1b_layer1_self_attn.k_proj_input_pretrain_representation.pth b/1b_layer1_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..52e2bf6eb70ed32ffbf618082d958bd712307587 --- /dev/null +++ b/1b_layer1_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2b7120ca0d673fd061c4bc71f838af8d0e9f20ac32b622aea7c61d31efcebfe +size 66700881 diff --git a/1b_layer1_self_attn.k_proj_output_pretrain_representation.pth b/1b_layer1_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..96c3668adfc29c4762edd8ec4f31fcfbc029f619 --- /dev/null +++ b/1b_layer1_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7102d9ddbaba2e3ad6dfab5dec8d1e0a506138deb03ed1a951f69c4e2bd2926 +size 16676438 diff --git a/1b_layer1_self_attn.q_proj_input_pretrain_representation.pth b/1b_layer1_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a5d6edba1685dd1367f68dc2b0319cc2b0ec79d8 --- /dev/null +++ b/1b_layer1_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6995b582d8794ea3555aab97bd89ef580d0fbffcf2ab03c795ce2cec9d38bcf5 +size 66700881 diff --git a/1b_layer1_self_attn.q_proj_output_pretrain_representation.pth b/1b_layer1_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1e4f2a8f760a6d6efa3110653260f90dad216477 --- /dev/null +++ b/1b_layer1_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24298bbdbc4705dbba498cdc0a50e8e162d8d1e9f772f91bccb9d4cd04bd0eb3 +size 66700886 diff --git a/1b_layer2_self_attn.k_proj_input_pretrain_representation.pth b/1b_layer2_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7bdc1eb0ad47beb8fe20416526b028b9a47e2fad --- /dev/null +++ b/1b_layer2_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1d570748a8cdfcb06e4e6a927d07e01e1ca0904ef57877c7466af92fecae92f +size 66700881 diff --git a/1b_layer2_self_attn.o_proj_input_pretrain_representation.pth b/1b_layer2_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..bf3faa1bc42323e0efb99f8b9df7eb77150d4b4d --- /dev/null +++ b/1b_layer2_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2217670f48027c93271b43c0683d1b8d88951a65b93d6cd085450ba244e735f +size 66700881 diff --git a/1b_layer2_self_attn.o_proj_output_pretrain_representation.pth b/1b_layer2_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b7d0f4f17905e9b73babaaa76afe2e49e68d3cc0 --- /dev/null +++ b/1b_layer2_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf3c21523a43846909eafb3644a2e274df28afcd89de37fc8c95180224df5d75 +size 66700886 diff --git a/1b_layer3_mlp.down_proj_output_pretrain_representation.pth b/1b_layer3_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..56c4be865eb5a55faba57b0612351040f9197312 --- /dev/null +++ b/1b_layer3_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdee2da11f01ca78a7dd03105db56afb6eef1008e3fc9eba35d8431cc4dd3e60 +size 66700871 diff --git a/1b_layer3_mlp.up_proj_input_pretrain_representation.pth b/1b_layer3_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..9b00b0417f665e58d2508b78ef78b6e9b6b5d447 --- /dev/null +++ b/1b_layer3_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9922702450686c5e15cdf0eae9553c43e4cccaeef27fcd5e58d37da74d945c1c +size 66700792 diff --git a/1b_layer3_self_attn.k_proj_input_pretrain_representation.pth b/1b_layer3_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..57a779ced85548f3beb0b0c082696a2cc3990c1f --- /dev/null +++ b/1b_layer3_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b226a254b3677c53d79d5a73db255b3d116fdf92a418032508e247a7ec9a199 +size 66700881 diff --git a/1b_layer3_self_attn.k_proj_output_pretrain_representation.pth b/1b_layer3_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7571f2b8c9634a794fcad0a6cddd169ce0414fd1 --- /dev/null +++ b/1b_layer3_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a52721b9e4f30115375e83477fd366bd7c72bc66792a2e42be485d14de38989 +size 16676438 diff --git a/1b_layer3_self_attn.v_proj_output_pretrain_representation.pth b/1b_layer3_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7a5fad1c4438a58b7442568b50a3fbaff7cae13e --- /dev/null +++ b/1b_layer3_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07c6d1c84b41ade7024c36318f50da59835be8a0c8c73839f08d4a24c44d80f1 +size 16676438 diff --git a/1b_layer4_mlp.up_proj_input_pretrain_representation.pth b/1b_layer4_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1e34cc981333ca73f6a1e74e380f1e271e450867 --- /dev/null +++ b/1b_layer4_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3b15b186bb0ff7592ee1a09280d2c95719c760cab0e9e99dfc1df145610929d +size 66700792 diff --git a/1b_layer4_self_attn.k_proj_input_pretrain_representation.pth b/1b_layer4_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..cd67f97c795d0516646bbf6f7a2c179b5b588833 --- /dev/null +++ b/1b_layer4_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8945bebd2fbbb492e7fda18a25454376ddf73b4a1905570b712668e2defb5863 +size 66700881 diff --git a/1b_layer4_self_attn.o_proj_output_pretrain_representation.pth b/1b_layer4_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f13f6c133497c34df541469ad8600a4e13b3bfc3 --- /dev/null +++ b/1b_layer4_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:720535dfc52a918eb37a61d1997cf3f249d70b044972b23b834ee9f45c3fc5cd +size 66700886 diff --git a/1b_layer4_self_attn.q_proj_input_pretrain_representation.pth b/1b_layer4_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..149ba7d9293adcc0b6778571292a7cace03b5afb --- /dev/null +++ b/1b_layer4_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a754b5fa07100c5c77ecf8c157a6b940d54c52ad583fabf08fe5f4b59acbd4f +size 66700881 diff --git a/1b_layer4_self_attn.v_proj_input_pretrain_representation.pth b/1b_layer4_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..083bb489f9865f8a7e74ced4f24552d6bd2bf543 --- /dev/null +++ b/1b_layer4_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d60c0273692e1ef994b6a3ffeb0dbc1b52dc4991c35c6405f565f712b8f8042a +size 66700881 diff --git a/1b_layer5_mlp.up_proj_input_pretrain_representation.pth b/1b_layer5_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..cc08529844965e0860af4e876dd8234bab3b7dfc --- /dev/null +++ b/1b_layer5_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e44d2bbd097e9ab9740445904002f1bd12edd1ef34d477edd3561edda97803bc +size 66700792 diff --git a/1b_layer5_self_attn.k_proj_output_pretrain_representation.pth b/1b_layer5_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4681617eee1137738ab832a980bf6d2e41b9feee --- /dev/null +++ b/1b_layer5_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96a078a7f4329fa71517238d155ef1fdbd4783f2b8be3a4546f2222f9793d9ad +size 16676438 diff --git a/1b_layer5_self_attn.q_proj_output_pretrain_representation.pth b/1b_layer5_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f07b4b48e9b119aef7fe3d93131e3969aba1959e --- /dev/null +++ b/1b_layer5_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79286d6f422e60502834948aa275d14dd84fb2535792f43847e82e1d76fe5a27 +size 66700886 diff --git a/1b_layer6_mlp.down_proj_output_pretrain_representation.pth b/1b_layer6_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f089c76ae11780cfd297c742129007609b8545e1 --- /dev/null +++ b/1b_layer6_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db097e869c25b3206da0747d95ec393ff206b75db2be5f68468ffb31abcdebf1 +size 66700871 diff --git a/1b_layer6_mlp.gate_proj_input_pretrain_representation.pth b/1b_layer6_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..def5130d0155bcf2cc7713b4106db6fe106962c5 --- /dev/null +++ b/1b_layer6_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30155732e241218fee027054c131ab99724f234708b75359f7fb450637f8eb74 +size 66700802 diff --git a/1b_layer6_mlp.up_proj_input_pretrain_representation.pth b/1b_layer6_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ee6f7ad3ec5b6acb15867204ece96751b7e62a33 --- /dev/null +++ b/1b_layer6_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5e18c314265335e019c175188709b4ae82f7ef8409b9253cb03964015a9308d +size 66700792 diff --git a/1b_layer6_self_attn.k_proj_output_pretrain_representation.pth b/1b_layer6_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b7ababa7564757d1226289a28ea7301c6ec80120 --- /dev/null +++ b/1b_layer6_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff29fc64123404e85525f492a5922924de9f3eb7d3935dc026ef5d08359e74a7 +size 16676438 diff --git a/1b_layer6_self_attn.o_proj_input_pretrain_representation.pth b/1b_layer6_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8835dc4b17d2505198fb40abef0ef1da99898130 --- /dev/null +++ b/1b_layer6_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:274e405f59fb59005ea7cd59ebe6bbb3a3fe6524e8bb3145a86e357a1010ac14 +size 66700881 diff --git a/1b_layer6_self_attn.o_proj_output_pretrain_representation.pth b/1b_layer6_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0e7686ba1505b4864e59ee9afe0b29dce339059d --- /dev/null +++ b/1b_layer6_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b53b9dcef30e3a0f7e676571fcdfd03d20cc0db126c3280dee15773e9a81cd49 +size 66700886 diff --git a/1b_layer6_self_attn.q_proj_input_pretrain_representation.pth b/1b_layer6_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..dc9a5b08c332e9efbd3a401d1338620187849893 --- /dev/null +++ b/1b_layer6_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa3d6e55864504cf200e9cb9114ca7582e095423376d88811e121b237ea2a527 +size 66700881 diff --git a/1b_layer6_self_attn.q_proj_output_pretrain_representation.pth b/1b_layer6_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d852bbe88ea4d4408886348128b47474633478dc --- /dev/null +++ b/1b_layer6_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:428fe88fd1b7bb91d688cae33a4d554d13186541a4193b61025d90945831e230 +size 66700886 diff --git a/1b_layer6_self_attn.v_proj_input_pretrain_representation.pth b/1b_layer6_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..3e131f7d29b075557a227dd6a803e4debdacf500 --- /dev/null +++ b/1b_layer6_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9819127e83aceec0c859c7657097335b2c72fec006349ed32580ed6c46d7ff4f +size 66700881 diff --git a/1b_layer6_self_attn.v_proj_output_pretrain_representation.pth b/1b_layer6_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7543eeac33d3a8b33fbfad368181aefc7b1301fe --- /dev/null +++ b/1b_layer6_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aead63ed389558a20826ccda784955a93e9298d6bdeff1199b7d00c1018734d +size 16676438 diff --git a/1b_layer7_mlp.down_proj_output_pretrain_representation.pth b/1b_layer7_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..60cff080383dd627f2aaf079a42e0fe6417945d4 --- /dev/null +++ b/1b_layer7_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9db5e4ac1f9a0ac411331710aee0e55d5dd825f7a20e14d0996dc62bc63d1580 +size 66700871 diff --git a/1b_layer7_mlp.gate_proj_input_pretrain_representation.pth b/1b_layer7_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..55690d4bb1d1c8a212866bb93b2635c4b8398209 --- /dev/null +++ b/1b_layer7_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:257e81898202091d815750d4503a4301375d3f606c0e7a2228e0380e7f315b20 +size 66700802 diff --git a/1b_layer7_self_attn.o_proj_input_pretrain_representation.pth b/1b_layer7_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c3b13675c6c44847800c34b505c8b364fcf0a4cc --- /dev/null +++ b/1b_layer7_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76fc16a9a8ec0fe131353ae03edb9404a0f46334edcf797ea749120d00eff11d +size 66700881 diff --git a/1b_layer7_self_attn.o_proj_output_pretrain_representation.pth b/1b_layer7_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8def1736a0452f22e02a26b383e36a8d5626fe65 --- /dev/null +++ b/1b_layer7_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f46c9f962e7315f6112dd027f80fcc0ba594bbd93197d5cd540f9cbbd2183253 +size 66700886 diff --git a/1b_layer7_self_attn.q_proj_input_pretrain_representation.pth b/1b_layer7_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..520d9804e5d4a5e3e317bc82677574f4673adb50 --- /dev/null +++ b/1b_layer7_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a6cdb6508dd02f1f245819166efe9f5f2cc7fc96db6852f6ed338500af46aef +size 66700881 diff --git a/1b_layer7_self_attn.q_proj_output_pretrain_representation.pth b/1b_layer7_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b52792049ab2aff7999bec5658f35040dba242fa --- /dev/null +++ b/1b_layer7_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5b79a42519362fc47b9f6037a1b761e78f19b132201191d051cb3c10a4e5e7d +size 66700886 diff --git a/1b_layer8_mlp.up_proj_input_pretrain_representation.pth b/1b_layer8_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..83fc00faaf62c611ba5b99493e0cac6c62d0d220 --- /dev/null +++ b/1b_layer8_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46e87fb8844282cbf7891def65a1a983c92e688a86946d8c140f896a707cdbdd +size 66700792 diff --git a/1b_layer8_self_attn.k_proj_output_pretrain_representation.pth b/1b_layer8_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..3e5422b47ea9359d8a91f1931334ed65ef8fad46 --- /dev/null +++ b/1b_layer8_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4918e3f76e0911ccbec4f677bc9ab7639d7de7a7cb33cbbae84375d1adeaaae +size 16676438 diff --git a/1b_layer9_mlp.up_proj_input_pretrain_representation.pth b/1b_layer9_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8978b64c58b56692d5a57336a576c92fac46583c --- /dev/null +++ b/1b_layer9_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4623785244cff07c635f866ff399ebc04408ae4c436c61c68e47bfe047f8f32d +size 66700792 diff --git a/1b_layer9_self_attn.k_proj_input_pretrain_representation.pth b/1b_layer9_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ba5116a2d563ab73b336dc87a16e84e52a01c28d --- /dev/null +++ b/1b_layer9_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:576ca36fd3779d52e3ce9c494e282451cf6a22eeaa9e7a92567650dab9a0e61d +size 66700881 diff --git a/1b_layer9_self_attn.o_proj_output_pretrain_representation.pth b/1b_layer9_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..42ec5325ff435f44310a059cf5079298100dd7d9 --- /dev/null +++ b/1b_layer9_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b71e50d5fa26927b5a3c044b33891b788d32d05dc274e73b62956e24f807aa35 +size 66700886 diff --git a/1b_layer9_self_attn.q_proj_input_pretrain_representation.pth b/1b_layer9_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e07a5eb85ed766eee87b8037df3d5e2d67316be4 --- /dev/null +++ b/1b_layer9_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ea5397cc4480655b55337cf61513282904daba282a1ee551c212dc8660e7a5a +size 66700881 diff --git a/1b_layer9_self_attn.v_proj_output_pretrain_representation.pth b/1b_layer9_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..82ff8e7161ce92501455447a0f4237da1605f67b --- /dev/null +++ b/1b_layer9_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f12d1c8ef93d40a8444dec95938a6c3ebf4c05071481126cef7ae2bd911e56e4 +size 16676438 diff --git a/3b_layer0_self_attn.k_proj_input_pretrain_representation.pth b/3b_layer0_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b4017c6c6164a5d2657bd65d2baadbba76008ebc --- /dev/null +++ b/3b_layer0_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:646bc0bfe54b9a5368e15764be01291d2ac6a531cc35ab445048cdd01a745f67 +size 133391953 diff --git a/3b_layer0_self_attn.o_proj_input_pretrain_representation.pth b/3b_layer0_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4a82f34ea17b25a2fd414b7c011e39f63c35b94f --- /dev/null +++ b/3b_layer0_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8110a81a875a7730a0508e0f17ad0a0f1017f09d841dce7c87685cc1c12f7a35 +size 133391953 diff --git a/3b_layer0_self_attn.q_proj_output_pretrain_representation.pth b/3b_layer0_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8f82c691d4a862826cd87184fce866f549b14609 --- /dev/null +++ b/3b_layer0_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5843dcfcccd20fc625654e362bde03cd155472af9c2e945a2f1c65a85c014eb +size 133391958 diff --git a/3b_layer0_self_attn.v_proj_input_pretrain_representation.pth b/3b_layer0_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4ce03e8a09ea2a674d92c8350a2d9c3ebf9fa13f --- /dev/null +++ b/3b_layer0_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e79c2d042250ae3719f8f83774671190fa12fca838fadc475da264be45d514cb +size 133391953 diff --git a/3b_layer10_mlp.down_proj_output_pretrain_representation.pth b/3b_layer10_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..cc1cf69cf92e41c92ac4132ff2ec4284c047bda7 --- /dev/null +++ b/3b_layer10_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fee4cfaecaf491b50f9b61fc4b40b7a9fb6a89d303ff82bdbd46e344ea8bac09 +size 133391948 diff --git a/3b_layer10_mlp.gate_proj_input_pretrain_representation.pth b/3b_layer10_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..24cae5883452435d7e755876beffe5b3d247f007 --- /dev/null +++ b/3b_layer10_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ebe2aa3ac24575d06e5afda9c6294cf59386f7973a62f21c07b8124207f0664 +size 133391943 diff --git a/3b_layer10_self_attn.k_proj_input_pretrain_representation.pth b/3b_layer10_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..bc791409948f003def1cb25c7318d373a8adbd39 --- /dev/null +++ b/3b_layer10_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0e69b4eef5253e6a98ed0475062c176b109bc5366c1526c2ada9138d26b0363 +size 133391958 diff --git a/3b_layer10_self_attn.k_proj_output_pretrain_representation.pth b/3b_layer10_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..40abc51f771970c3be1d5a86718fdcc08da237dd --- /dev/null +++ b/3b_layer10_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb455956caf0ecaf3b50baf3faaeccfcb3ba8d8d97bf0207ec3771c6f9558725 +size 33349211 diff --git a/3b_layer10_self_attn.q_proj_input_pretrain_representation.pth b/3b_layer10_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..57f501c302cbbb5bcf7702b82faf7383818cea3c --- /dev/null +++ b/3b_layer10_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeea9b4927149e361b034b7d33c5cadfe34fe8eb4ff0c093c2c6eb8ae5305d3d +size 133391958 diff --git a/3b_layer10_self_attn.v_proj_input_pretrain_representation.pth b/3b_layer10_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..74c7ea13572960fb7e4d5a1f72d5aff218ff41b8 --- /dev/null +++ b/3b_layer10_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23d054ab4875d7734e319278e248ce242b45c7d01875b1ff12e61ce78be232a4 +size 133391958 diff --git a/3b_layer11_mlp.down_proj_output_pretrain_representation.pth b/3b_layer11_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f529a7285e23c5c50a28ce7591ed257cfbc60151 --- /dev/null +++ b/3b_layer11_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3a84407723623ffa781475f3362c3c15a48426d936f636b12913f05dce62646 +size 133391948 diff --git a/3b_layer11_mlp.gate_proj_input_pretrain_representation.pth b/3b_layer11_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ae4390d6922826645aa8361fd895929de114dcfc --- /dev/null +++ b/3b_layer11_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c01f5230a196e887a9b11a04295b410865ffdbff70d310afe557a7752788c2fd +size 133391943 diff --git a/3b_layer11_mlp.up_proj_input_pretrain_representation.pth b/3b_layer11_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..00216beae6953b89f677f1d0097677decf14b5e2 --- /dev/null +++ b/3b_layer11_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b09fdc10bd66b06d612939cbf3e2695ae674db10667f2488eec71c92f60da217 +size 133391869 diff --git a/3b_layer11_self_attn.k_proj_input_pretrain_representation.pth b/3b_layer11_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..9cb195c31e0a6664d55404eaa1b18cf645c11221 --- /dev/null +++ b/3b_layer11_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa6bb74a2eaed0e98c7fda4128ca7e3197a7b1d5e68258890e2c8faac5704bcc +size 133391958 diff --git a/3b_layer11_self_attn.o_proj_input_pretrain_representation.pth b/3b_layer11_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..092110fbfcd8fa7788503f2a7bb8dc6cb221a9e0 --- /dev/null +++ b/3b_layer11_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:876c4e9b7421a9b89f24da86a4eb5d248313a51f9029466a0f153dcf59da20c7 +size 133391958 diff --git a/3b_layer11_self_attn.q_proj_input_pretrain_representation.pth b/3b_layer11_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1e1e3d7ee8da8fdbc850e2e17630da294eb64b7c --- /dev/null +++ b/3b_layer11_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd09e50aa6a82f74791ded7ff8f1821bf73743d90dc6d68551708473e6cbe3b +size 133391958 diff --git a/3b_layer11_self_attn.q_proj_output_pretrain_representation.pth b/3b_layer11_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0e41906b99e76917a03d44d75a0b15936a8cc390 --- /dev/null +++ b/3b_layer11_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01ccbec2d28d33aeb8633d7220766182bb3da74176633601fdf8a9efb3e29c9e +size 133391963 diff --git a/3b_layer12_mlp.up_proj_input_pretrain_representation.pth b/3b_layer12_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..79cbb4f86b9993546f37abeba9f8da20a0f1220f --- /dev/null +++ b/3b_layer12_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a97d72d5df42584a5a35af54c0edda5871f9ff78d67afd5445cb66f021698b4d +size 133391869 diff --git a/3b_layer12_self_attn.q_proj_output_pretrain_representation.pth b/3b_layer12_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..52df46b07ad2b2102b4252563540fdb33b6bab26 --- /dev/null +++ b/3b_layer12_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8af3c8d387403d21693b9a6411d90b1e697319f5a249ada797ded731548ab22 +size 133391963 diff --git a/3b_layer13_mlp.up_proj_input_pretrain_representation.pth b/3b_layer13_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7150cba273e0f6d8ba300d139f3494efd3ead273 --- /dev/null +++ b/3b_layer13_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf037a725e1697b5a9acfc3134c295423052fcedfd6e5a5864ddbd6b91c10e0c +size 133391869 diff --git a/3b_layer13_self_attn.q_proj_output_pretrain_representation.pth b/3b_layer13_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2c9a541975e6d951e623113d0215364f85c7a309 --- /dev/null +++ b/3b_layer13_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1b0e07acf99d59f162921ffbeaeacc542d1922b8c84d89c2b0f950c4b9805db +size 133391963 diff --git a/3b_layer13_self_attn.v_proj_output_pretrain_representation.pth b/3b_layer13_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7af7857695f5023ce33f97998bb3ffcba6fb9eca --- /dev/null +++ b/3b_layer13_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d77b597cb7ee410870d8e40d4401208ca83dc7a25417d4515c4bf60d9a11b86 +size 33349211 diff --git a/3b_layer14_mlp.gate_proj_input_pretrain_representation.pth b/3b_layer14_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4e5a487cf85d59138b88f95c8d50a2c7759c3039 --- /dev/null +++ b/3b_layer14_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6da85400f625f71006b044206e9e5f992c6a2d570a4cae6bffa9a733b174a488 +size 133391943 diff --git a/3b_layer14_self_attn.k_proj_output_pretrain_representation.pth b/3b_layer14_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..09c6fe4aa165fce2f4f8d34ec2c986a2bc1d0bdf --- /dev/null +++ b/3b_layer14_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa427e713e7b5ca41e48e63c551e8f8a5ec0173408afef2eb3c78868734d0180 +size 33349211 diff --git a/3b_layer14_self_attn.q_proj_output_pretrain_representation.pth b/3b_layer14_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..92d1c3a7b0ada49504fbd9dd4601d11b813056df --- /dev/null +++ b/3b_layer14_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3af17ef2d3c5c08be9d8f737ac3a8d0cd51fbf783888db8d422ee94f6fe18860 +size 133391963 diff --git a/3b_layer14_self_attn.v_proj_output_pretrain_representation.pth b/3b_layer14_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..eb5728b86c3fccab8d61fab14c87c9383263a53d --- /dev/null +++ b/3b_layer14_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcb47258f0c1788857488a1fbe9767e81838f4091884c95eb3ba8db8720a81c8 +size 33349211 diff --git a/3b_layer15_mlp.up_proj_input_pretrain_representation.pth b/3b_layer15_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..22189f861b1ea30c696d0f130b4b6e1f5ae87b48 --- /dev/null +++ b/3b_layer15_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb3ce589d93623d7c63887eb805d81f1fd8979cc832df8fcabf43ad7330b1592 +size 133391869 diff --git a/3b_layer15_self_attn.o_proj_input_pretrain_representation.pth b/3b_layer15_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..515ca4afd4ce7d876815e7c32075ff74d1606bfc --- /dev/null +++ b/3b_layer15_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57d08a1fc4591efb5d0a1c182eac5e60a9762d444da96e9c4d9073a7d166cc6a +size 133391958 diff --git a/3b_layer15_self_attn.o_proj_output_pretrain_representation.pth b/3b_layer15_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..39b0831a6014de0bc505c470f901390f26a965ab --- /dev/null +++ b/3b_layer15_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97c0183d7787403f29b6f0dd5b4e6842284d6f5b4259084974e7e7b70f447c83 +size 133391963 diff --git a/3b_layer1_self_attn.q_proj_input_pretrain_representation.pth b/3b_layer1_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..68d03a5675ac7b0aecc2ab7916634ba0f082ad43 --- /dev/null +++ b/3b_layer1_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:752c4c4cb95c9c6fb05b47b18c275782f0bac2318a8dce608ecba033fb1d0dd9 +size 133391953 diff --git a/3b_layer1_self_attn.v_proj_output_pretrain_representation.pth b/3b_layer1_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8ef2085cbae7d7c46f81fde8927e0b66d41dde6f --- /dev/null +++ b/3b_layer1_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6608ab16652f04335db331213b62d60f66e8f3a08026e1dddaa1f1c7b3e5a4bd +size 33349206 diff --git a/3b_layer2_mlp.down_proj_output_pretrain_representation.pth b/3b_layer2_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a08e882c728fc1c18980e537cdd231c4843c41da --- /dev/null +++ b/3b_layer2_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:663aaab51e29149da17821314246505b9fb6b3bb860bca277cf51df9981bd08a +size 133391943 diff --git a/3b_layer2_mlp.gate_proj_input_pretrain_representation.pth b/3b_layer2_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a7a8abc04f60b4fecd82002af0219e491d73d11d --- /dev/null +++ b/3b_layer2_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dadf0ca2a96b99a404f43c0b3fff7b197a9b9e929e6a45327dbfe5e0465ccc0f +size 133391874 diff --git a/3b_layer2_self_attn.o_proj_input_pretrain_representation.pth b/3b_layer2_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d3416edf18b6cab8925a10f290edc95f86ff5c6f --- /dev/null +++ b/3b_layer2_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6c4672ad321e699165b6bec6eacadb605ca179e1fb83623a2642fde561dfae7 +size 133391953 diff --git a/3b_layer2_self_attn.o_proj_output_pretrain_representation.pth b/3b_layer2_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..506abd83c2eac6960a74dde4b091979dc796b66c --- /dev/null +++ b/3b_layer2_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d890265eca39a1de4e18ac31c054af6bb2493963403ac561f2918ec7d2ac5952 +size 133391958 diff --git a/3b_layer3_mlp.up_proj_input_pretrain_representation.pth b/3b_layer3_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..bfa9a54656cb6a0a74b667a950286d34faf93582 --- /dev/null +++ b/3b_layer3_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d36ffb8b6cd15f5b7a6b2be26c01f56aafaaf42872a14c481cf22596b5c8ac5b +size 133391864 diff --git a/3b_layer3_self_attn.k_proj_input_pretrain_representation.pth b/3b_layer3_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8bcdaaf316a50c74c10663f08fe1444f22277eca --- /dev/null +++ b/3b_layer3_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14e4d1070238c8c0f23f7e4aa20e9230c05bc6326a1d6aeeee25d62fabf8bc3c +size 133391953 diff --git a/3b_layer3_self_attn.k_proj_output_pretrain_representation.pth b/3b_layer3_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1610c6fb51c3885fd67c1b5d7345c74cccae1808 --- /dev/null +++ b/3b_layer3_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:633b68ed8b41e5313ca449f5fdbc59a932dff0c98edf7103c67224ed0372ff56 +size 33349206 diff --git a/3b_layer3_self_attn.o_proj_input_pretrain_representation.pth b/3b_layer3_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2abdb5adc09ca21a9c9063bd901aef94444b048a --- /dev/null +++ b/3b_layer3_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fccca1230331d2187fdbbb54063afcf6fdcccde68127520dddf73d0588f1372 +size 133391953 diff --git a/3b_layer3_self_attn.o_proj_output_pretrain_representation.pth b/3b_layer3_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..cb43f2cbd9303417b452256631f03ed32b59563e --- /dev/null +++ b/3b_layer3_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf94488e03835aa211653f328fd9e940eeb175cc64e2fa366b889ebe9221ce5 +size 133391958 diff --git a/3b_layer3_self_attn.v_proj_output_pretrain_representation.pth b/3b_layer3_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c4cdc51b1639a18af0188a46b69233204ec7fdf9 --- /dev/null +++ b/3b_layer3_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23c4eb8bd9bce89aa58dbb29eb8e34e963e5db3461adacd6802dc2d55ec545e8 +size 33349206 diff --git a/3b_layer4_mlp.down_proj_output_pretrain_representation.pth b/3b_layer4_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0541e93e354f4a556606bd3f012586ba88da2e70 --- /dev/null +++ b/3b_layer4_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02d3ff007b67671785828f25dd341e2e9549211c3dcd1c50f80a1f14d5a5111c +size 133391943 diff --git a/3b_layer4_self_attn.k_proj_output_pretrain_representation.pth b/3b_layer4_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..64dcef32edff96dc9c5fd15e297c3ef3799b571a --- /dev/null +++ b/3b_layer4_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e70d76de4af2d5cbd52054be7d66f7ff01e6ce5b88f0e7d187a996d608541134 +size 33349206 diff --git a/3b_layer4_self_attn.o_proj_output_pretrain_representation.pth b/3b_layer4_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ebfbf60a50aba7a7ad1696ae5ce8d82841e866d6 --- /dev/null +++ b/3b_layer4_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39c5e306d60cdc3a88a1a369afb678dbeaadcf82d4952645148030d4d6d9556d +size 133391958 diff --git a/3b_layer4_self_attn.q_proj_output_pretrain_representation.pth b/3b_layer4_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0c94f02e6303b4d7b7a1b667e774753db17d54dd --- /dev/null +++ b/3b_layer4_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0492259eb0a6e7e550c06e04f21a0a18d91add480e9de6eeb2583db3fd12b47 +size 133391958 diff --git a/3b_layer5_mlp.down_proj_output_pretrain_representation.pth b/3b_layer5_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e1a33fa461cbdbde3b16a4074d66afc73ab078e6 --- /dev/null +++ b/3b_layer5_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d9c4b11380a7172f198f75b49bf075aa4cb8ace9edfce8fc32b3119e279b33f +size 133391943 diff --git a/3b_layer5_self_attn.k_proj_input_pretrain_representation.pth b/3b_layer5_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..fa1baa2909dbbe62d5b700e3803073b9c18dd05b --- /dev/null +++ b/3b_layer5_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:062c108608a5bc26256056e57a20d0e30ef5c329444ec46743907301c10cfaa9 +size 133391953 diff --git a/3b_layer5_self_attn.q_proj_output_pretrain_representation.pth b/3b_layer5_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..3d89ddf0e8dd41e86b3c35f03e388d057a6cbd7a --- /dev/null +++ b/3b_layer5_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1984288a8beea785bd0ece0450dec31678694733bd5f603f681015b4cbef86df +size 133391958 diff --git a/3b_layer6_mlp.down_proj_output_pretrain_representation.pth b/3b_layer6_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c89d825b2e2cc22841be2c30b4c504cddae4af35 --- /dev/null +++ b/3b_layer6_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:810563c8ab983aefa3c036a26f9afe160fe90383dd94daecadc12d4bff72f158 +size 133391943 diff --git a/3b_layer6_mlp.gate_proj_input_pretrain_representation.pth b/3b_layer6_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..78c99537aefd4487e5d8b729896d555826918361 --- /dev/null +++ b/3b_layer6_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9701d509786ecce72174f49249c4ee9a5ab89401d68971fd53686b6b8c4cc08 +size 133391874 diff --git a/3b_layer6_mlp.up_proj_input_pretrain_representation.pth b/3b_layer6_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..32e9649fc3bcb43db1c5afd9714878e4658b7f06 --- /dev/null +++ b/3b_layer6_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77035f09efe8e24455dfa15932dd8c910a2423b6a150aa612c1eeab724813149 +size 133391864 diff --git a/3b_layer6_self_attn.k_proj_output_pretrain_representation.pth b/3b_layer6_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8e75a2c8d8a8a64dd5027bebaf7f34bbd58d3e8d --- /dev/null +++ b/3b_layer6_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee0a07fd6ae70687f5c9a2216c48f8bab988f27d5610e1d3be954700c63033cb +size 33349206 diff --git a/3b_layer6_self_attn.o_proj_input_pretrain_representation.pth b/3b_layer6_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ade415b4ad6175b0037c5af42df5398a8cd50c35 --- /dev/null +++ b/3b_layer6_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f6c9ec8e56ae15fdb82c88943d8e7d27e34b7be95eefb40eef017407e86e597 +size 133391953 diff --git a/3b_layer6_self_attn.v_proj_input_pretrain_representation.pth b/3b_layer6_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..96ed19c05c1c26e847930a1c7b7a31671ca40eda --- /dev/null +++ b/3b_layer6_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c67c2ca96fff21fa7b908c3d8d0fc8083ec2a5e7534506d8968147307c42312b +size 133391953 diff --git a/3b_layer6_self_attn.v_proj_output_pretrain_representation.pth b/3b_layer6_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..93be3627f4c6d93f4065089b4ab3deb450101bb3 --- /dev/null +++ b/3b_layer6_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59381cfc92fab38dc118e953389f29559344e326fa1c527398b7c7657bbfdc74 +size 33349206 diff --git a/3b_layer7_mlp.up_proj_input_pretrain_representation.pth b/3b_layer7_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..898ceab1c9a8002970d224e3ed8ad54118fde67f --- /dev/null +++ b/3b_layer7_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31f8c34173c4149fe4a1ed4f56eccd0716630fc3ef0ffa1bb32d4d13a1e11a9b +size 133391864 diff --git a/3b_layer7_self_attn.k_proj_output_pretrain_representation.pth b/3b_layer7_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e044fae571eed06e388db2bdd5896b8222bef6a3 --- /dev/null +++ b/3b_layer7_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13da311f7c39fc92c45aa759ed0763d16e74ff959eb49bd6f72a8f26baa393b7 +size 33349206 diff --git a/3b_layer7_self_attn.v_proj_input_pretrain_representation.pth b/3b_layer7_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8f1de2037ad29a77617936e098ae09fd4a284c74 --- /dev/null +++ b/3b_layer7_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed884265e2242e74dfe02b77ebf6cbb9d5b89d5216da09230d3f2c7c578d8d90 +size 133391953 diff --git a/3b_layer8_self_attn.k_proj_input_pretrain_representation.pth b/3b_layer8_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e62aa2c8317f21bb3b2e11eb100fbfeb2f718381 --- /dev/null +++ b/3b_layer8_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfeea4b8e2847b462ae60303d0085332d2ba4abaaa6bb4f79bf92359e7235f2a +size 133391953 diff --git a/3b_layer8_self_attn.v_proj_output_pretrain_representation.pth b/3b_layer8_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0087d8f95596c2b0fc049a6074654f0bd0dad2b9 --- /dev/null +++ b/3b_layer8_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67f6ea4413ea856f149fe07ea447c300dfb05315872ce2978a4f672e1506c03a +size 33349206 diff --git a/3b_layer9_mlp.down_proj_output_pretrain_representation.pth b/3b_layer9_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7729ed9f2d501d308d2fec3a3841b34fe4d4a900 --- /dev/null +++ b/3b_layer9_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51f0a090e65d43617be12d7895a2d27a04e52125219ca2e944b67d4256ada500 +size 133391943 diff --git a/3b_layer9_mlp.gate_proj_input_pretrain_representation.pth b/3b_layer9_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..91765d94caa3db59d15b40ad2ab6502a0d6d9448 --- /dev/null +++ b/3b_layer9_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1900b7bd9f6da9d0175d3bd5a13aa7a745f8bebeb6da051807acc73e1912ad8 +size 133391874 diff --git a/3b_layer9_self_attn.o_proj_input_pretrain_representation.pth b/3b_layer9_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..41cfe97d54b6436e258248461429b5c2a3d914aa --- /dev/null +++ b/3b_layer9_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6662d2939c2767e42bc95bf28676e23d941253ccb5498ee88c2942b0c241fb2a +size 133391953 diff --git a/3b_layer9_self_attn.q_proj_input_pretrain_representation.pth b/3b_layer9_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..6ee74fe8bc20d75f27fcc231216eee55cbe142b5 --- /dev/null +++ b/3b_layer9_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8cf944a7ccd906f66f9d19395cd62fc60fc5be0dd9e0f329ecd3d803438a2be +size 133391953 diff --git a/3b_layer9_self_attn.v_proj_input_pretrain_representation.pth b/3b_layer9_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..bc584414320c339cdb7449b9a712e5b5000a07c4 --- /dev/null +++ b/3b_layer9_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e5397d4f23352bdbb8d8e64066b33401f72c9ead71c884d660834ad4f06e05a +size 133391953