diff --git a/1b_layer0_mlp.gate_proj_output_pretrain_representation.pth b/1b_layer0_mlp.gate_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d6286edc09ae19da1fdbca6fc6c1a8da2c75b0b2 --- /dev/null +++ b/1b_layer0_mlp.gate_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eeb54e12133ed35a004b02ece90e5edc0c10e93e14054fade85dac44b7be1f5 +size 266798663 diff --git a/1b_layer0_mlp.up_proj_output_pretrain_representation.pth b/1b_layer0_mlp.up_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4219bd319349707bdd4f9011757caf0414206c0c --- /dev/null +++ b/1b_layer0_mlp.up_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcaa5c8e255df24c8f7cbce8fe95015c26447d07bc58854d0da619724b07810f +size 266798589 diff --git a/1b_layer0_self_attn.q_proj_input_pretrain_representation.pth b/1b_layer0_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d3b354d8964e109e0df33376e7cbed2e6022a152 --- /dev/null +++ b/1b_layer0_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c6e303091c0feb745ac594d860d8f2a494d5ab6f6dd6334de4c361418ec6bed +size 66700881 diff --git a/1b_layer0_self_attn.q_proj_output_pretrain_representation.pth b/1b_layer0_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..6f1a500c380fd07faa5e229f20f02fe9e76ffa76 --- /dev/null +++ b/1b_layer0_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37485b9c2827c79f4cf192a475c4c34e2c02f8392a26f406cdb48864e6364de3 +size 66700886 diff --git a/1b_layer10_mlp.gate_proj_output_pretrain_representation.pth b/1b_layer10_mlp.gate_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..fac8a8c32adc3cf7c89847879418cd68f02e25b1 --- /dev/null +++ b/1b_layer10_mlp.gate_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:149437de9a47067a732ef162245d743ceee947770b05c21d2c25ed9a289a0e70 +size 266798668 diff --git a/1b_layer10_mlp.up_proj_output_pretrain_representation.pth b/1b_layer10_mlp.up_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0599140617e121ee86d4c3ca7353e0e7f848a058 --- /dev/null +++ b/1b_layer10_mlp.up_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f80ea519dac20e41b87cc778236410283d2c7b828470411e5a0af15327e32b0f +size 266798594 diff --git a/1b_layer10_self_attn.q_proj_output_pretrain_representation.pth b/1b_layer10_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..004c58cce2dd2f6ab094a8cc7b22333be6c36a11 --- /dev/null +++ b/1b_layer10_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a641cc95f6f35f8eb2b7f483ba1e9275dfad601c81ef8acd8531fc86d627cba +size 66700891 diff --git a/1b_layer11_mlp.gate_proj_output_pretrain_representation.pth b/1b_layer11_mlp.gate_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4a70efb3336a3625c2df2f9e9638434b04c51882 --- /dev/null +++ b/1b_layer11_mlp.gate_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3033df9bec697ae5dd955d9cb9fdfca6f36d619b03bc0cc8c675826302ef0b00 +size 266798668 diff --git a/1b_layer11_mlp.up_proj_output_pretrain_representation.pth b/1b_layer11_mlp.up_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..abeba182436e60b9639da8553d2a26b77f36dca8 --- /dev/null +++ b/1b_layer11_mlp.up_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5af66560b4a2d83c535897ced36940ed131654c931b9e112f7f621d4de5dcd69 +size 266798594 diff --git a/1b_layer11_self_attn.k_proj_output_pretrain_representation.pth b/1b_layer11_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..9a8c789b6700394d5296ad0eb216db53bfa0248a --- /dev/null +++ b/1b_layer11_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fae8f0778a9549130faaa9203f0d5ea657882b87e522eec6b1aa9c5cb18af26 +size 16676443 diff --git a/1b_layer11_self_attn.v_proj_input_pretrain_representation.pth b/1b_layer11_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ff4f86a06f9215cee298cf8c620264ef6381c730 --- /dev/null +++ b/1b_layer11_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2610dac5161543cccd94e48040574638e47f044a8b384721cf5a7a3fbc6719af +size 66700886 diff --git a/1b_layer12_mlp.down_proj_input_pretrain_representation.pth b/1b_layer12_mlp.down_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7cd236176dc87966862befced04ef24a73978994 --- /dev/null +++ b/1b_layer12_mlp.down_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3da2ca2b612d4e09e599e9a26b05cf9a6b21eb4afa41a5a8d44f92b9bb7c4b63 +size 266798663 diff --git a/1b_layer12_mlp.gate_proj_input_pretrain_representation.pth b/1b_layer12_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..982ab862ce4d90b43af2bcceccc433526e128f6b --- /dev/null +++ b/1b_layer12_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58d6ce838200c98a417d2f9037b953ef1071251ebecefce15dfb42c51238fc57 +size 66700871 diff --git a/1b_layer12_self_attn.k_proj_input_pretrain_representation.pth b/1b_layer12_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..73332b44e693f7ad7cbd0b28594974029e8c97c4 --- /dev/null +++ b/1b_layer12_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:840bf9d05de88d8ce18e5235edbe90bc45049e5daf24a171eb493bd6acde32d5 +size 66700886 diff --git a/1b_layer12_self_attn.k_proj_output_pretrain_representation.pth b/1b_layer12_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e1f92c312e6d1d4e099864fb9d1ad0c357044ddf --- /dev/null +++ b/1b_layer12_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ee54514eccca909b0bf57640c5b7ebc5a87e0c9fcf8a46763d31e562c8b8dc2 +size 16676443 diff --git a/1b_layer12_self_attn.o_proj_output_pretrain_representation.pth b/1b_layer12_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..13db7c63a63de80ca2a011707fe8f28c81a5ce28 --- /dev/null +++ b/1b_layer12_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26e70a76cf53dda9be6c8c4de73f62b35dd2b10b68bd6839d03a94295959f3c4 +size 66700891 diff --git a/1b_layer12_self_attn.q_proj_output_pretrain_representation.pth b/1b_layer12_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5f6c797bf795c803d545abcc830ced6d8cecd3e0 --- /dev/null +++ b/1b_layer12_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c841a43f21a67906d6f082d8453d8ca9b688dc4e116a5d9bae1917bd50aefe16 +size 66700891 diff --git a/1b_layer13_mlp.down_proj_input_pretrain_representation.pth b/1b_layer13_mlp.down_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..185d509eaed85b0d11f59fe37163746884e794d7 --- /dev/null +++ b/1b_layer13_mlp.down_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8479e985883514c9b5108dcd0799df3f0286ea7f0fa0517a7755c857cd71860c +size 266798663 diff --git a/1b_layer13_mlp.down_proj_output_pretrain_representation.pth b/1b_layer13_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..aa9403e40835594fbf31405522defc3a2c9b808a --- /dev/null +++ b/1b_layer13_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c277c7081bd67fa7f8ae1815f5f347282ba01da5775a4de0f16ca1645c5234e8 +size 66700876 diff --git a/1b_layer13_mlp.gate_proj_input_pretrain_representation.pth b/1b_layer13_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2391824ae4552a3a1ce8335c4daefebc00efc783 --- /dev/null +++ b/1b_layer13_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd1d199af0f56aa836b73db523d78e98394614178849d45f25ec0a9d2138fa9b +size 66700871 diff --git a/1b_layer13_mlp.up_proj_input_pretrain_representation.pth b/1b_layer13_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..37e19bd30f7a83b004d3677799aec086c5e106e8 --- /dev/null +++ b/1b_layer13_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b594127741d58a07e987ea1c0d6d129f73b6aa966bbe57035f4cb3b1a57b7888 +size 66700797 diff --git a/1b_layer13_mlp.up_proj_output_pretrain_representation.pth b/1b_layer13_mlp.up_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..82fc5bcf36a3e7ffc330765c7bc4bef9d3fe1ca5 --- /dev/null +++ b/1b_layer13_mlp.up_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84ff0e58800b7ea59cadd89f6ea3f52ea3134a0e82d7516d9dbebf9c903f256d +size 266798594 diff --git a/1b_layer13_self_attn.k_proj_output_pretrain_representation.pth b/1b_layer13_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f714b9d4834b87e5cae9c8a640c84af55b692c5d --- /dev/null +++ b/1b_layer13_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78ebdf1e398fd9ca612a89560dee4b592e1ac600cf9cd1ae7e733ecda2d28574 +size 16676443 diff --git a/1b_layer14_mlp.down_proj_input_pretrain_representation.pth b/1b_layer14_mlp.down_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ad5dec8bb04c68442ac1e822fb4108cdedd7ab0c --- /dev/null +++ b/1b_layer14_mlp.down_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87fccc6117d83b2f02db1267e52122d4dc23ba62c69241e720a74f3b2d620405 +size 266798663 diff --git a/1b_layer14_mlp.down_proj_output_pretrain_representation.pth b/1b_layer14_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..cbe9980f4feb44d2b32ebc1ce867ca7a1b282f12 --- /dev/null +++ b/1b_layer14_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b50979b8502eb47643dd200ef9b6cc3b1a9c044849634907deee807b3683ce43 +size 66700876 diff --git a/1b_layer14_mlp.gate_proj_input_pretrain_representation.pth b/1b_layer14_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..467d07d84ad8a5be5c0100c0c77e37af5d9fafd8 --- /dev/null +++ b/1b_layer14_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:345f7c131daa294b88c30f55563cdcdcbe4609db896cead31eb2a798a282f5e7 +size 66700871 diff --git a/1b_layer14_mlp.up_proj_output_pretrain_representation.pth b/1b_layer14_mlp.up_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..961589d70eeeb32ea8a3659407ddc239aeea4565 --- /dev/null +++ b/1b_layer14_mlp.up_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb7f2a8f3efb3067bbd16c501d5fc57e66832f94af568366dd15c7249e2d0cb6 +size 266798594 diff --git a/1b_layer14_self_attn.k_proj_input_pretrain_representation.pth b/1b_layer14_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0d33c247169855ea5c5d1086a23539698d903d95 --- /dev/null +++ b/1b_layer14_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d24346c617c47f465dea6929ccd046d393042a4f0e0b12acb0a0a3f236a3695 +size 66700886 diff --git a/1b_layer14_self_attn.o_proj_input_pretrain_representation.pth b/1b_layer14_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1ed19f285990b99fccd24221a28eaeaa92c43e96 --- /dev/null +++ b/1b_layer14_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cd4889fc8fc8e95318a29c2e54b834622f8437ec20f2894719294adcbafbc4d +size 66700886 diff --git a/1b_layer14_self_attn.q_proj_output_pretrain_representation.pth b/1b_layer14_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..15bb6f6e56c1cb2c7e7ba287d4497d84998d82ac --- /dev/null +++ b/1b_layer14_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa35cfc19fb5805865dac51b2e125d0e5080bbd60e1f89eda886ceb296b92e4e +size 66700891 diff --git a/1b_layer15_mlp.down_proj_input_pretrain_representation.pth b/1b_layer15_mlp.down_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..26b33b0ad004eeddfc43c1caeacc98616d1f7f10 --- /dev/null +++ b/1b_layer15_mlp.down_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7773a072913dc62f1bcb8391caf7d95f3db548ccdcad120653c8ac0d914287ab +size 266798663 diff --git a/1b_layer15_mlp.down_proj_output_pretrain_representation.pth b/1b_layer15_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7df022a5d49e4307eb194f58e6adea7a83e37462 --- /dev/null +++ b/1b_layer15_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7d284e8be55305b485f2ae174454335db4362e39a81b3adc421df054eafcfa7 +size 66700876 diff --git a/1b_layer15_mlp.up_proj_input_pretrain_representation.pth b/1b_layer15_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d44d9a6a7a06aafbd3622c3bb4f39d184bf2c6e8 --- /dev/null +++ b/1b_layer15_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b63ea5f9dc4c72314242c921f4fd194cf2d8f9f99a90d3dfbca1c5a33dd9c8be +size 66700797 diff --git a/1b_layer15_mlp.up_proj_output_pretrain_representation.pth b/1b_layer15_mlp.up_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4156c59b40cacea2a5c1b95b5f016d2eae0e8f7d --- /dev/null +++ b/1b_layer15_mlp.up_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f602c275573e9dc65be6d13082bbabd184fc36ed7299cf35797a0d5d4e621cae +size 266798594 diff --git a/1b_layer15_self_attn.q_proj_input_pretrain_representation.pth b/1b_layer15_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..201c2196010573b1c8b8455e9ca014b9af0f2d36 --- /dev/null +++ b/1b_layer15_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68da57065e6573cc4f5b4711d96d5d528202da566e4376bd3c709a298f33653b +size 66700886 diff --git a/1b_layer15_self_attn.q_proj_output_pretrain_representation.pth b/1b_layer15_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0cfaa9f60beb569245eaf3171b1ab33b69c0213f --- /dev/null +++ b/1b_layer15_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:651b4d1756acb43ce5bbeddd1578889ffc83adde6b4da1f22ddc03ebaac840fa +size 66700891 diff --git a/1b_layer1_mlp.down_proj_output_pretrain_representation.pth b/1b_layer1_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0005380c9593757a6049f2da945a94a8cb576432 --- /dev/null +++ b/1b_layer1_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d6f876f53d5502c23e5b7b4cf57c332abd09030968c74ffaa2a925a8595c0fb +size 66700871 diff --git a/1b_layer1_self_attn.o_proj_input_pretrain_representation.pth b/1b_layer1_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0f6ba9e0d2f8f93775403e2759f118713fedec0a --- /dev/null +++ b/1b_layer1_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f783115a4db577d09d428af8793b9b6cf1d2264a46aa0c17f4b8bcd234f5077 +size 66700881 diff --git a/1b_layer1_self_attn.o_proj_output_pretrain_representation.pth b/1b_layer1_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8c1d09231f7161967f0afc9bcef23adfc1051382 --- /dev/null +++ b/1b_layer1_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a34fa260abd98a937d58dea0cce844a3dd03037875270d454e4423846f844940 +size 66700886 diff --git a/1b_layer1_self_attn.v_proj_input_pretrain_representation.pth b/1b_layer1_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8b0db9a66a96b997b6ee4b262ff284ee58f4243a --- /dev/null +++ b/1b_layer1_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:310d8888614e5d2ad347134174d15ab3c2ff51a0fe10c62ec0e2a53951f6dab9 +size 66700881 diff --git a/1b_layer1_self_attn.v_proj_output_pretrain_representation.pth b/1b_layer1_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..524925d4b904c32e453ef31edcb46dbc960d48f1 --- /dev/null +++ b/1b_layer1_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a90434f202de6673bcb503863fb30c607303040ed8de5479c483a27fd805a6a9 +size 16676438 diff --git a/1b_layer2_mlp.down_proj_input_pretrain_representation.pth b/1b_layer2_mlp.down_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2f61c58e756cdd1813535b03e1035317aa5eb592 --- /dev/null +++ b/1b_layer2_mlp.down_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f61df732e0dd374b1aa1e9ba719420e4b48d53b355242b9769b73952488bf65 +size 266798594 diff --git a/1b_layer2_mlp.down_proj_output_pretrain_representation.pth b/1b_layer2_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..aa01d54d920233ecde5e9febe1361c1639873149 --- /dev/null +++ b/1b_layer2_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3a27b9dd5f22af24d14b685971aa3bfc2539861c63ab85b53483b14fb98d918 +size 66700871 diff --git a/1b_layer2_mlp.up_proj_input_pretrain_representation.pth b/1b_layer2_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7ff8a08e6db6c19edb6ec9f55935147f65172697 --- /dev/null +++ b/1b_layer2_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25b93eb2f48f7f8c89fd18ecbcd65ab81da8ba4f69a838f07263617203f658ad +size 66700792 diff --git a/1b_layer2_mlp.up_proj_output_pretrain_representation.pth b/1b_layer2_mlp.up_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f87484eadbfdd2ea9e83c195063560e08757a81a --- /dev/null +++ b/1b_layer2_mlp.up_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78d2dd4f5917ba01b50e1165923995ac0edebfd5299f5faab6c05efe1fc45165 +size 266798589 diff --git a/1b_layer2_self_attn.k_proj_output_pretrain_representation.pth b/1b_layer2_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d1c42b5eb46bd9e16aa82b803685864579f0ecdf --- /dev/null +++ b/1b_layer2_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70a7930a04b34c65658bdd5eb167295cd1a258b1b2b033c670b5ae153e2e4e88 +size 16676438 diff --git a/1b_layer2_self_attn.q_proj_input_pretrain_representation.pth b/1b_layer2_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d148f8d58df38e3a48c501861c82fea53b1dcace --- /dev/null +++ b/1b_layer2_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a505c774f37c05e91899071fefc8f9a5248152fe4e3fcd62727f8e08c810031f +size 66700881 diff --git a/1b_layer2_self_attn.q_proj_output_pretrain_representation.pth b/1b_layer2_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..dc87a00c396447dc4f89f6f32185e0d8bda607a8 --- /dev/null +++ b/1b_layer2_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d087505dc431703d56b4b8c630b256e5197c5298cf397efbc0656383b5c7740e +size 66700886 diff --git a/1b_layer2_self_attn.v_proj_output_pretrain_representation.pth b/1b_layer2_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d99feac305719a71d08099a261f230b38ad3f4c2 --- /dev/null +++ b/1b_layer2_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:063c9a1cd1097d0a96e378ddd0ad46a4d7b5c5fc4be6fea89a156f28880c0ebd +size 16676438 diff --git a/1b_layer3_mlp.down_proj_input_pretrain_representation.pth b/1b_layer3_mlp.down_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4d056a30270a18e3a6f47d9d0f7a99761b3189d2 --- /dev/null +++ b/1b_layer3_mlp.down_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acd806db5a4425ecbdb09c6e0b27abc67cd2e924b4b53abc800564bac33ebd08 +size 266798594 diff --git a/1b_layer3_mlp.gate_proj_input_pretrain_representation.pth b/1b_layer3_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5980dccc57bd417173dcc9af4eec48d2ace023ed --- /dev/null +++ b/1b_layer3_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4c457b52eb9e7bb64b48b8b9c6c38778854aea4fc1acd6e9262ad014091a901 +size 66700802 diff --git a/1b_layer3_self_attn.o_proj_input_pretrain_representation.pth b/1b_layer3_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c39b842c3d223c85e086d37c9b634a2fd02cdfc2 --- /dev/null +++ b/1b_layer3_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90a3f1c6e40ade00ce8826e5538f4f3a7869a2a178295b018c63ef261333f416 +size 66700881 diff --git a/1b_layer3_self_attn.q_proj_output_pretrain_representation.pth b/1b_layer3_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..98d41b93f5d1dc0000542f5c60bfbc89fd5e544b --- /dev/null +++ b/1b_layer3_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a876a2890476d507f6205272d9704d98443cd86f5c8580d694627e671c76327 +size 66700886 diff --git a/1b_layer3_self_attn.v_proj_input_pretrain_representation.pth b/1b_layer3_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..59a0ba47ae553993736ac4c34c73fa74020d1d68 --- /dev/null +++ b/1b_layer3_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f877a672c940af0742cb3d7183186370301db74f1e30b2d2fa9b3e40066df952 +size 66700881 diff --git a/1b_layer4_mlp.down_proj_input_pretrain_representation.pth b/1b_layer4_mlp.down_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..fa2a99f9d1d4801e6f7c5b6ac0aca5c089d71889 --- /dev/null +++ b/1b_layer4_mlp.down_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a0d167be36dab7f3e852238e73707ee8e854f70d215b1c14308866d66605871 +size 266798594 diff --git a/1b_layer4_mlp.gate_proj_input_pretrain_representation.pth b/1b_layer4_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..672ed10a3fc047965cfcba1c0403578811153954 --- /dev/null +++ b/1b_layer4_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a2f01fef69781075b86c535236a036444c0cedd8f9c9d036b555c41e1588ffa +size 66700802 diff --git a/1b_layer4_mlp.gate_proj_output_pretrain_representation.pth b/1b_layer4_mlp.gate_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4838e482eeddcbb90f9e8be1f79a6e2f7512c862 --- /dev/null +++ b/1b_layer4_mlp.gate_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b7028af1025ee017774f48988f91e8a6125abccc57fc8e3b5e31ade98f488da +size 266798663 diff --git a/1b_layer4_self_attn.o_proj_input_pretrain_representation.pth b/1b_layer4_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..fc64a3d3facbcb8c9a7ea75953428fa0d6b450e1 --- /dev/null +++ b/1b_layer4_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cf128e1e3aeb6d5d2b778380d44c331ffa86c63b7d88df002651ca3f4077e61 +size 66700881 diff --git a/1b_layer5_mlp.down_proj_input_pretrain_representation.pth b/1b_layer5_mlp.down_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..892f04f5bce455a800b6bec403e993fcc5dbf561 --- /dev/null +++ b/1b_layer5_mlp.down_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07a3449432c6b039ec0eeab01f173529b67cc3fa4e8764c5c12a745153046ef1 +size 266798594 diff --git a/1b_layer5_mlp.down_proj_output_pretrain_representation.pth b/1b_layer5_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2811a659d5800c9050d334930304fa17dbd36f0a --- /dev/null +++ b/1b_layer5_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22e85f2aeff26085207ce59625b3e4c2f177118b6ccccd7bf9dd46b18d4f456c +size 66700871 diff --git a/1b_layer5_mlp.gate_proj_input_pretrain_representation.pth b/1b_layer5_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0448ace4e9a8b909ed02c38954e45095ec74a450 --- /dev/null +++ b/1b_layer5_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10499252f747e981f92db6569e636d457c22dc43890b293085305891433fd13c +size 66700802 diff --git a/1b_layer5_mlp.gate_proj_output_pretrain_representation.pth b/1b_layer5_mlp.gate_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e445fbd6c8e333299eacde356f0134897de16aab --- /dev/null +++ b/1b_layer5_mlp.gate_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55adaad11ea6d447a5de6025ba375f03686cfff4d6a557708b4b08a42db90e07 +size 266798663 diff --git a/1b_layer5_self_attn.q_proj_input_pretrain_representation.pth b/1b_layer5_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..edcb347f4554b3e0db2558aacee92648bb7c3923 --- /dev/null +++ b/1b_layer5_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c0be05ccb2219b9ebf8fbe00a3cc70809d2ce33ca2f9b4f18bed31ec777cccf +size 66700881 diff --git a/1b_layer5_self_attn.v_proj_input_pretrain_representation.pth b/1b_layer5_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..033b7140eff26f8ef2231520d85bd80d5c41c9ff --- /dev/null +++ b/1b_layer5_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f87af1c7627163c2d3ce8d3a82e51f71ce4f858a9fc4c80b76cf1f23abd3b37 +size 66700881 diff --git a/1b_layer5_self_attn.v_proj_output_pretrain_representation.pth b/1b_layer5_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..86e8a06905c662b4714fd4a2a20054dbce29331b --- /dev/null +++ b/1b_layer5_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14a0fdc2636af53e5e4ec56a0de35478b0fc543221f27e0c7320f51d4c18fb2c +size 16676438 diff --git a/1b_layer6_mlp.down_proj_input_pretrain_representation.pth b/1b_layer6_mlp.down_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..64c4e62f2be337e7d89a066af256c944da25932b --- /dev/null +++ b/1b_layer6_mlp.down_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a10dd6fd9e20b72d1054e1482b12db8342402f9eda13d4e7a3fe1e00fc27e073 +size 266798594 diff --git a/1b_layer6_mlp.gate_proj_output_pretrain_representation.pth b/1b_layer6_mlp.gate_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..56f96357b24cafc206cfcd4f64e44ede293bc6dd --- /dev/null +++ b/1b_layer6_mlp.gate_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:549f1e493f45a7e218dc045385f7bd68c9528b1b26e5c6f73bf9787ec8f35f2e +size 266798663 diff --git a/1b_layer6_mlp.up_proj_output_pretrain_representation.pth b/1b_layer6_mlp.up_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f95f73a4a28b5c5aca0aa352093dd35bb5b14306 --- /dev/null +++ b/1b_layer6_mlp.up_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05015c7eb687ad79464d78d01d5cd8f3c58d207fe6659fdf782cceec2fa32775 +size 266798589 diff --git a/1b_layer7_mlp.gate_proj_output_pretrain_representation.pth b/1b_layer7_mlp.gate_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..69bd1bfff341efb0efda26ba3d2f47d0c033bd61 --- /dev/null +++ b/1b_layer7_mlp.gate_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6acff4a3a5f363e03772ba60a4c63962d5e03dfca5d3ccc8728eea2d5a4d1807 +size 266798663 diff --git a/1b_layer7_mlp.up_proj_input_pretrain_representation.pth b/1b_layer7_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e54664d5eab8688d0095c261a7b9fd43660c4fd7 --- /dev/null +++ b/1b_layer7_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14d6e3f61e7ff55cd42d0277acea576058f1225dcee1644c1f0ea2f690430bde +size 66700792 diff --git a/1b_layer7_mlp.up_proj_output_pretrain_representation.pth b/1b_layer7_mlp.up_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ac796b3ddd513065ce72263a2e90c506a9f0f49d --- /dev/null +++ b/1b_layer7_mlp.up_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc2dd208c5997d7642f2d2ac048d0a880c895f9f9b8a53e53bccc42cd7630942 +size 266798589 diff --git a/1b_layer7_self_attn.v_proj_output_pretrain_representation.pth b/1b_layer7_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..77c8de8ce844ae59bf7e4d6951b7a85bb29f10fc --- /dev/null +++ b/1b_layer7_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:411b2ec505c4787e5daa92b347e9e4fb837e489fcba24e5967af9c187c65c20a +size 16676438 diff --git a/1b_layer8_mlp.gate_proj_output_pretrain_representation.pth b/1b_layer8_mlp.gate_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ee56b483ccc452dfc0051268745f75323b33d08b --- /dev/null +++ b/1b_layer8_mlp.gate_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83ec35a9f2f6e8cf5dfcd3f4d04e26da8c459a9583993e4117cdf7c9b360d792 +size 266798663 diff --git a/1b_layer8_mlp.up_proj_output_pretrain_representation.pth b/1b_layer8_mlp.up_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..cf1ff74ccc2ab0db399ddc846c6f4c303f7996e4 --- /dev/null +++ b/1b_layer8_mlp.up_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43ed5a163a45abd75ae2f00be5326a99a620b9b7398889288f6e25be013dbbd8 +size 266798589 diff --git a/1b_layer8_self_attn.k_proj_input_pretrain_representation.pth b/1b_layer8_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..43c6586911fdb323f0d02755fcdeac753225f4e5 --- /dev/null +++ b/1b_layer8_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb8141944b76bacf56562483f09af4160a1403e5a34336d886f159b2e2e743a0 +size 66700881 diff --git a/1b_layer8_self_attn.o_proj_output_pretrain_representation.pth b/1b_layer8_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e4fc0d05bb48b3b475ff073137edff4950cb5339 --- /dev/null +++ b/1b_layer8_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d6f2c66814b26dbea8291aaf8c1fb82872dc62fcc6dede81eea9b8bbdf1e656 +size 66700886 diff --git a/1b_layer8_self_attn.q_proj_input_pretrain_representation.pth b/1b_layer8_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..df5e4fb17bc675bb721394ffba67466f29afd179 --- /dev/null +++ b/1b_layer8_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5fe7929e596f65cd37d3be666df3a281a397b35824e53b58ffa345977ca3683 +size 66700881 diff --git a/1b_layer9_mlp.down_proj_output_pretrain_representation.pth b/1b_layer9_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..81427bb43d07da30ed0e55c11265c2dd463dcf32 --- /dev/null +++ b/1b_layer9_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a631133b7eeaa6f3ff7caa3654cca7b2fe1952ab7b7b42318e99bd4a373432c9 +size 66700871 diff --git a/1b_layer9_mlp.up_proj_output_pretrain_representation.pth b/1b_layer9_mlp.up_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..629491ab1acdaee1e615df03bd3d0760d126d286 --- /dev/null +++ b/1b_layer9_mlp.up_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbaa7711034c992c3326b66a9196c25b0211861923a668198bdc44f21a1319f7 +size 266798589 diff --git a/1b_layer9_self_attn.k_proj_output_pretrain_representation.pth b/1b_layer9_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..abc6694f8c89c974fd8ca7c4bd89b43a0fa39a92 --- /dev/null +++ b/1b_layer9_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecb197471c7f72416e989c5a3fb56e8a5fb9e6faf62f71206c7f550c36dd9b6e +size 16676438 diff --git a/1b_layer9_self_attn.q_proj_output_pretrain_representation.pth b/1b_layer9_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..72853db0f0dc07136c474dac8c29fd2847aaaef0 --- /dev/null +++ b/1b_layer9_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf516298663f526c9380403db429c13510c5c210303851170fa75caa2b858834 +size 66700886 diff --git a/1b_layer9_self_attn.v_proj_input_pretrain_representation.pth b/1b_layer9_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c479f92bb26c54bc1ed8f5274a34fcbb414d8595 --- /dev/null +++ b/1b_layer9_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d475863cc6caebced01f49ed029f04ac28a9bfe443ea1c20df4dda9f8469c013 +size 66700881 diff --git a/3b_layer0_mlp.down_proj_input_pretrain_representation.pth b/3b_layer0_mlp.down_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f631934363adf76840612116064b2520f2d618d5 --- /dev/null +++ b/3b_layer0_mlp.down_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07a70c5c865744e7410517cc3c6eb59c25cb91f590b0a22e4f841d07ea8aa8ca +size 533562882 diff --git a/3b_layer0_mlp.gate_proj_input_pretrain_representation.pth b/3b_layer0_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2fca2458d5bde3e5906dec44646c81dfb09a0638 --- /dev/null +++ b/3b_layer0_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d3e52ee5ea857f34bcdaf1718cbee2c0c49914cb7faafdbe0df0cc97a5c0dec +size 133391874 diff --git a/3b_layer0_self_attn.k_proj_output_pretrain_representation.pth b/3b_layer0_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c8364d39e50d317d59fa8830ddf38b5854043458 --- /dev/null +++ b/3b_layer0_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2b821f8789b704cc13b83f505231ba7c92d9a008d155b311f83c352401523fe +size 33349206 diff --git a/3b_layer0_self_attn.q_proj_input_pretrain_representation.pth b/3b_layer0_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7b7f6451d09a47e3512f1fab0b260848b5f549b9 --- /dev/null +++ b/3b_layer0_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cd2849f495a30d2fbff99b5a8d280bdd5d9a231e10d9929c181660acab622a1 +size 133391953 diff --git a/3b_layer10_mlp.up_proj_input_pretrain_representation.pth b/3b_layer10_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..6f33417abec16f3473eb6e2a1426d5c42296bc66 --- /dev/null +++ b/3b_layer10_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67b0256a51ef4021ad8a465f706edaf65ca4d4c3a1825f71f53c16da41629a0a +size 133391869 diff --git a/3b_layer10_self_attn.q_proj_output_pretrain_representation.pth b/3b_layer10_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..28d377cb2c6d4e29b598e72e2673ce14d34b18eb --- /dev/null +++ b/3b_layer10_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cef6b5404b924115f4be85f8a45350c96ec1e647662ffa797fdb705d958b9235 +size 133391963 diff --git a/3b_layer10_self_attn.v_proj_output_pretrain_representation.pth b/3b_layer10_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..6287bb0daab6e9eaf7db7fc93879d006622f2f80 --- /dev/null +++ b/3b_layer10_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaf39d919275ceb34d1ea719b8bfdf22df1bdee8cd027ac595e4ea4281f51387 +size 33349211 diff --git a/3b_layer11_self_attn.v_proj_output_pretrain_representation.pth b/3b_layer11_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1806513275f9fde50aff19d88b06e6757f49812a --- /dev/null +++ b/3b_layer11_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03dd291268c738f365ac542e723f67ccff77a9de1ecf04c0d5bfe5869017a77a +size 33349211 diff --git a/3b_layer12_mlp.down_proj_input_pretrain_representation.pth b/3b_layer12_mlp.down_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7e56d7f3c5e1ed86fc6395054686eb853f07b58b --- /dev/null +++ b/3b_layer12_mlp.down_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d71312b3cb17a8988f7499b6a97ad80021a635f8f6f04289f0fd40ccbe2b097 +size 533562951 diff --git a/3b_layer12_mlp.gate_proj_input_pretrain_representation.pth b/3b_layer12_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f04cc4dff9a546283e10ef93c63f910a4b4b4110 --- /dev/null +++ b/3b_layer12_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beaa493d8aed3c94e0d8f5acb6765075d4841767f2d8ead2341c492b1d33e872 +size 133391943 diff --git a/3b_layer12_mlp.gate_proj_output_pretrain_representation.pth b/3b_layer12_mlp.gate_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2fc0a9a4436da85c39b708178b6f3a32542de2b6 --- /dev/null +++ b/3b_layer12_mlp.gate_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f29eeaa47bbd2e2984a5304efb912c2cbc25095d5df29a6fe93b6fa94cb6c6d6 +size 533562956 diff --git a/3b_layer12_mlp.up_proj_output_pretrain_representation.pth b/3b_layer12_mlp.up_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..972436f008955591f06d7b2307bd5062e83c1a7d --- /dev/null +++ b/3b_layer12_mlp.up_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:336df97089119f1b87d16a23da40090b2dc448fdda8c2b312ef0b874fb5a5d27 +size 533562882 diff --git a/3b_layer12_self_attn.k_proj_output_pretrain_representation.pth b/3b_layer12_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..105919a8427c6ae992b84decb4ef2a2a2b8bea78 --- /dev/null +++ b/3b_layer12_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1d752321d6e7f70baae4a0dd375813b1e740ad70fb8a27a7ddb7dd1e0a04564 +size 33349211 diff --git a/3b_layer12_self_attn.o_proj_output_pretrain_representation.pth b/3b_layer12_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..159e457bd45ad0cc20f734d82e018312d4c86ac1 --- /dev/null +++ b/3b_layer12_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a5673d400f5b25a0281a61b1a1ecf43b07d173ee3d08375dfa7178dd49c3f55 +size 133391963 diff --git a/3b_layer12_self_attn.q_proj_input_pretrain_representation.pth b/3b_layer12_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e9e752b4da6121879c008d9683bb2c1c391bddb2 --- /dev/null +++ b/3b_layer12_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81990247d2a9ef9184695e5116c07d8e31ef69f6b9ce40414eea8e3e57d386fb +size 133391958 diff --git a/3b_layer12_self_attn.v_proj_output_pretrain_representation.pth b/3b_layer12_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..bdf4c721af57a249aa7d3c4045a19cb3b931d712 --- /dev/null +++ b/3b_layer12_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:099ee60f869b4990056a4846f8991d45f6d1a452b0f5d79880f5cfe6f291c0b7 +size 33349211 diff --git a/3b_layer13_mlp.down_proj_input_pretrain_representation.pth b/3b_layer13_mlp.down_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..efb25f7fbfa23f01dc9c7e1a50d4af6ab5110e7e --- /dev/null +++ b/3b_layer13_mlp.down_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18c034e1826205341922e850f0de36f73a29b0dee964f768ab7264294ee7684e +size 533562951 diff --git a/3b_layer13_mlp.gate_proj_output_pretrain_representation.pth b/3b_layer13_mlp.gate_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5918cc7406dff54f01963f5d0b733cb43ee72035 --- /dev/null +++ b/3b_layer13_mlp.gate_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a3ca2378bc19c032a0e21677abdbd1aeb4aaa90a7eb641dd3d544ec4e17b829 +size 533562956 diff --git a/3b_layer13_self_attn.o_proj_input_pretrain_representation.pth b/3b_layer13_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..3163bf7731b39852c3e7ba89e579b9fb4c4dfc68 --- /dev/null +++ b/3b_layer13_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16076e7243a392b01fbacfb508b1e270d1b5fb87f9fbbe575d5f18e6fa7b11ac +size 133391958 diff --git a/3b_layer14_mlp.down_proj_output_pretrain_representation.pth b/3b_layer14_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..af109d251779537bb22fe694898e31e84262b131 --- /dev/null +++ b/3b_layer14_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:993e5b2e69fd6cfc5b5b4b595815dce6e7d94f23c3f56007f0b77039a741bd29 +size 133391948 diff --git a/3b_layer14_mlp.up_proj_input_pretrain_representation.pth b/3b_layer14_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a59fb64a887df13a05f7ca5a9012a354673d2c5a --- /dev/null +++ b/3b_layer14_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ad5ca20434061bd72ead41422db7ae6d9ad86bb61c53a35ea6ac9b03a3034fc +size 133391869 diff --git a/3b_layer14_self_attn.k_proj_input_pretrain_representation.pth b/3b_layer14_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..668cacb5d3bd30ec23d202137e396bc37890aa41 --- /dev/null +++ b/3b_layer14_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61093ed054fd242194b3de07ea8e5f285c8e4f24e6b1a3cae476e4ebcd7342f0 +size 133391958 diff --git a/3b_layer14_self_attn.o_proj_input_pretrain_representation.pth b/3b_layer14_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f8e0fab9ca63fb43188ab62710513034abddcbc6 --- /dev/null +++ b/3b_layer14_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ef0f4d4153dcabf3acf72f8875d3b52cefeb30e43ad8c43983a82b5e97a8a9 +size 133391958 diff --git a/3b_layer14_self_attn.o_proj_output_pretrain_representation.pth b/3b_layer14_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..cab17826dc52c4011ae498bd8cde4b9535bbcb51 --- /dev/null +++ b/3b_layer14_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d4c4be8ad52bb06d17e8b39711622c1844cbcea09c9d69d2e35ea7897eac88c +size 133391963 diff --git a/3b_layer14_self_attn.q_proj_input_pretrain_representation.pth b/3b_layer14_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..663b4bcafe134ac7f7877ac8a718c1000e11713d --- /dev/null +++ b/3b_layer14_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ff81a81cedf07b1bbc8357fa963b0c9a6cbc92672424d3c60f09b2d3c3aab92 +size 133391958 diff --git a/3b_layer14_self_attn.v_proj_input_pretrain_representation.pth b/3b_layer14_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2658cbcdd6a06ae46556852245ec862f788c2944 --- /dev/null +++ b/3b_layer14_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8df9dcc1f553b842f682e720e72d7cfeeeb9dd46e13d9dfc30ffa8c9c0c36d6 +size 133391958 diff --git a/3b_layer15_mlp.down_proj_output_pretrain_representation.pth b/3b_layer15_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..edcbd8d2bc83363b676e1750378a869a02765b3a --- /dev/null +++ b/3b_layer15_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae478bb57faeb97bf10fd55bda099fcc8edbe363596133fc167af6654ddeeee8 +size 133391948 diff --git a/3b_layer15_mlp.gate_proj_output_pretrain_representation.pth b/3b_layer15_mlp.gate_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5b4494fcf065638d49d47f76b6cbed46ec61909a --- /dev/null +++ b/3b_layer15_mlp.gate_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcb9370883b64d7116f0412b8879ef6a0ec4faf2edf48721ce777d8928522776 +size 533562956 diff --git a/3b_layer15_self_attn.k_proj_input_pretrain_representation.pth b/3b_layer15_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..fd8a743f29a567eb2446aa674d7ff940b26b9e09 --- /dev/null +++ b/3b_layer15_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4b5c46e568caf7cde889ec5914817972e28d10f7510295231ec617623ff026c +size 133391958 diff --git a/3b_layer15_self_attn.k_proj_output_pretrain_representation.pth b/3b_layer15_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..fb5ddd8e33559cb70228cb0fe55796984701cdee --- /dev/null +++ b/3b_layer15_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:715e847e6ff3f7c064c8c7a4fb907e98687c61eac8ace5ad5296e21c4f37a8f1 +size 33349211 diff --git a/3b_layer15_self_attn.v_proj_input_pretrain_representation.pth b/3b_layer15_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..3f44458859f1c0a7e4c72439b7833948e8fe383b --- /dev/null +++ b/3b_layer15_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fee222be8c90e6015fef2fb5946abd1b873a23629f4fbeeebf5e5021b3b63381 +size 133391958 diff --git a/3b_layer1_mlp.down_proj_input_pretrain_representation.pth b/3b_layer1_mlp.down_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e057d13a46aa7c173078e85b46fc1574e4dfc37e --- /dev/null +++ b/3b_layer1_mlp.down_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11097e086e587f3b1e41b7840fd796c7895e1c8f581a08ab5882c6522f42013e +size 533562882 diff --git a/3b_layer1_mlp.up_proj_input_pretrain_representation.pth b/3b_layer1_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..554756908be56fd92497d4ce604fc6ac47941969 --- /dev/null +++ b/3b_layer1_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99e4ae899412aab781183793e4e61d1567e494248b75cbaabf087551e793d101 +size 133391864 diff --git a/3b_layer1_self_attn.k_proj_output_pretrain_representation.pth b/3b_layer1_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..adda40e05ff563afc32638a44c8b7f6cd59fb25f --- /dev/null +++ b/3b_layer1_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42fb70cba12cfbfc526c214f0bd1c6cff8f83162eeb7e45f62060d427e39d286 +size 33349206 diff --git a/3b_layer2_mlp.down_proj_input_pretrain_representation.pth b/3b_layer2_mlp.down_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b4b1c64c83d335b9a9f2874c8cb3203f38ffe637 --- /dev/null +++ b/3b_layer2_mlp.down_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa2146584dfc3bc23b7d15af930175bc7eb7d529ba8943024b32286b07830295 +size 533562882 diff --git a/3b_layer2_mlp.up_proj_input_pretrain_representation.pth b/3b_layer2_mlp.up_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..15617eb6582afbb8bec075246a52863ed31d3f86 --- /dev/null +++ b/3b_layer2_mlp.up_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5092b003db07d360b0435c544a150431cf912a51dc6ba81c12e83d2867a1a43 +size 133391864 diff --git a/3b_layer2_mlp.up_proj_output_pretrain_representation.pth b/3b_layer2_mlp.up_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4010f1c7f3b050f420fb5c9ed42bb3c62114c39b --- /dev/null +++ b/3b_layer2_mlp.up_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13d0eb9b09cabd63a0a657001f6466e0692ab1a64048c05bfddaf68dc133df49 +size 533562877 diff --git a/3b_layer2_self_attn.k_proj_output_pretrain_representation.pth b/3b_layer2_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..300b4cc59ab4bc54613d6d370569dbc91eaffca7 --- /dev/null +++ b/3b_layer2_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9654c8ad26fcee42549a95bb8b56e8b89b7e8a6b6a403c1f6befffd64f390a1c +size 33349206 diff --git a/3b_layer2_self_attn.q_proj_input_pretrain_representation.pth b/3b_layer2_self_attn.q_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..37112c84a251c086755733e43f2672f608dd2a10 --- /dev/null +++ b/3b_layer2_self_attn.q_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd2968aac95bc062df79c4965d85abb7f1cdd112a36175dc6b55579dd52f5f8 +size 133391953 diff --git a/3b_layer2_self_attn.v_proj_input_pretrain_representation.pth b/3b_layer2_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7b928db378923cfafda7e13c15a7d840e2921a63 --- /dev/null +++ b/3b_layer2_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1faa58638d69b36f21e6c3d2ec4b47ae853d071a1f9e682946b31245abad99c9 +size 133391953 diff --git a/3b_layer2_self_attn.v_proj_output_pretrain_representation.pth b/3b_layer2_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b313ea4865dc2c676439f2ce7d279f7df1536cac --- /dev/null +++ b/3b_layer2_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6874a6a6e6dd00704d6f97b39fbac3ab62bdd9006c2687388b8e547d76fecedd +size 33349206 diff --git a/3b_layer3_mlp.down_proj_input_pretrain_representation.pth b/3b_layer3_mlp.down_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a095353717f3bf47e000f2d746c267d12cec72b1 --- /dev/null +++ b/3b_layer3_mlp.down_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ef0e791c138ede5c743f5f572c63e489fdf6a2f3b2900e05eebe90ca2dec4fd +size 533562882 diff --git a/3b_layer3_mlp.gate_proj_output_pretrain_representation.pth b/3b_layer3_mlp.gate_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0c8278367e1a85cb8e53bad4b79dad8fe51b3747 --- /dev/null +++ b/3b_layer3_mlp.gate_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f32c06f0060784213c60f7ad78d573b5f1b9a93d8477f03d6d26432f69d4980 +size 533562951 diff --git a/3b_layer4_mlp.gate_proj_input_pretrain_representation.pth b/3b_layer4_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5483976014ccc4d2c478458c3a01e3fc3dda87e4 --- /dev/null +++ b/3b_layer4_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:212776bd9fd83b0e9e06d796e9df2da889fd7ee8d328357102edd47ff3ea1ccc +size 133391874 diff --git a/3b_layer4_mlp.up_proj_output_pretrain_representation.pth b/3b_layer4_mlp.up_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..06dfe1d6bdc7f5baab092594d50ec3b90afa416a --- /dev/null +++ b/3b_layer4_mlp.up_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85a0b4215c1c595c3d21589b4619fdfcd243a5b4c9343a62ee23cc948132fe9d +size 533562877 diff --git a/3b_layer4_self_attn.k_proj_input_pretrain_representation.pth b/3b_layer4_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..27bb058e10840f53a1aab9a171c23cdcabedae7a --- /dev/null +++ b/3b_layer4_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64cc4b36bf9bad41217108acb0449a43c0a62eb8e9c070cd66e101d0696a35ff +size 133391953 diff --git a/3b_layer4_self_attn.o_proj_input_pretrain_representation.pth b/3b_layer4_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..db7766db364d35f1b7d4edc08d8a6ede7d48d24c --- /dev/null +++ b/3b_layer4_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20d8da80c92bd78a1ede18790e42b23e6de9c811af39fe92ddaede1f04b81005 +size 133391953 diff --git a/3b_layer4_self_attn.v_proj_output_pretrain_representation.pth b/3b_layer4_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..fec058fcbbcb03925239cc5085f2345589955df2 --- /dev/null +++ b/3b_layer4_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77bfc8823e1387008c7ab89e5e72c778913c3bbf68c5d636b7f089a99fdf865b +size 33349206 diff --git a/3b_layer5_self_attn.k_proj_output_pretrain_representation.pth b/3b_layer5_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5e7ebb02ba8b7165e8a1a7aa698ebf3ae7a65514 --- /dev/null +++ b/3b_layer5_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e999a18a20fe37e4b4a037d344c6abf21ada15dd48d08f976a70902610135538 +size 33349206 diff --git a/3b_layer5_self_attn.o_proj_input_pretrain_representation.pth b/3b_layer5_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a697d7216edc197d83d6c9a43f80688599e62076 --- /dev/null +++ b/3b_layer5_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:654454d5c86f9a1fa8237666d07b68ccb060eeef50555c0b3b4f1c0e6c57c24e +size 133391953 diff --git a/3b_layer5_self_attn.v_proj_input_pretrain_representation.pth b/3b_layer5_self_attn.v_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c19592a80ba864c9416a92ee31d472e787875451 --- /dev/null +++ b/3b_layer5_self_attn.v_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88352653bb4004af3e647c7457a1bf1e1d173cdea7a4396d4721fa14fb851e36 +size 133391953 diff --git a/3b_layer5_self_attn.v_proj_output_pretrain_representation.pth b/3b_layer5_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b14a7cf93b69fae058025396af9b6481ed849278 --- /dev/null +++ b/3b_layer5_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec5a34a1f7b001d015d5daf344374704f8e1b07e68631804f8371962c670366d +size 33349206 diff --git a/3b_layer6_self_attn.o_proj_output_pretrain_representation.pth b/3b_layer6_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..57d39827ae24b033abec6fe07cdc35642d20dd8e --- /dev/null +++ b/3b_layer6_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fd7f75949930bd67850c394e230690fb59f3a37c51df5933f763a17ce8fe27d +size 133391958 diff --git a/3b_layer6_self_attn.q_proj_output_pretrain_representation.pth b/3b_layer6_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..43e9a021cc30a27c17fc7986aeeeab6150751c79 --- /dev/null +++ b/3b_layer6_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e37710cf176b7f8769d641e0ee7efa02414ae1e1d56e2df6e9bda68fcb91d18 +size 133391958 diff --git a/3b_layer7_mlp.gate_proj_input_pretrain_representation.pth b/3b_layer7_mlp.gate_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ca5ea9d4665788f4c05f99f01d054dd7081befd1 --- /dev/null +++ b/3b_layer7_mlp.gate_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef868c5f9e19e128760750e73f1634ec04173d7db217c07dd1101819e6744ce9 +size 133391874 diff --git a/3b_layer7_mlp.gate_proj_output_pretrain_representation.pth b/3b_layer7_mlp.gate_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1be4245f6ea48e385bdb59cc5fb0b0fd018cb0a6 --- /dev/null +++ b/3b_layer7_mlp.gate_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1475a179920b30cce154b84950121705a67797daee3afbc27cd587302b98a242 +size 533562951 diff --git a/3b_layer7_self_attn.k_proj_input_pretrain_representation.pth b/3b_layer7_self_attn.k_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f2a0d738a033d02ba3fba7590a2698c6b309dde2 --- /dev/null +++ b/3b_layer7_self_attn.k_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7473cbfafdf430537d8572f13416eaf98d84b5658c3508f14e2ad8e09654a522 +size 133391953 diff --git a/3b_layer7_self_attn.o_proj_input_pretrain_representation.pth b/3b_layer7_self_attn.o_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d2ad1a2153495d51088fd6a1c46c71b2fa434804 --- /dev/null +++ b/3b_layer7_self_attn.o_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e06efdb475ff31a275d0bd7e84b1738aab8b86dce7a7c82e2cb07b13b17e5ee +size 133391953 diff --git a/3b_layer7_self_attn.o_proj_output_pretrain_representation.pth b/3b_layer7_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..edf8dd6e06b225427163614f93288757318869ec --- /dev/null +++ b/3b_layer7_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1ea073a04b7cc76c554ca97dfb91d83bd2c264cddd0cadc028f73a6074fc9c7 +size 133391958 diff --git a/3b_layer7_self_attn.v_proj_output_pretrain_representation.pth b/3b_layer7_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..488cd47df2000f3a3b63cd314ed97bc0c6272489 --- /dev/null +++ b/3b_layer7_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7395dace94e0ff7df79fc5e32472ebb5b33f983a9c44b5e2c91f6c9229a75847 +size 33349206 diff --git a/3b_layer8_mlp.down_proj_output_pretrain_representation.pth b/3b_layer8_mlp.down_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..42a307f17ff8e4f44e49ecbc801fdc25a72a2276 --- /dev/null +++ b/3b_layer8_mlp.down_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:544dde4e39536191e36032b2e8d884ae2ecc28356f769db373a8dfbd922e7727 +size 133391943 diff --git a/3b_layer8_mlp.gate_proj_output_pretrain_representation.pth b/3b_layer8_mlp.gate_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..35080f0ebad547e06956c4659eda5af6511a510a --- /dev/null +++ b/3b_layer8_mlp.gate_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:016221d41702c5a182b780f59bec09c8db7efce544ee5fd83aba9a7a7684c3a4 +size 533562951 diff --git a/3b_layer8_self_attn.k_proj_output_pretrain_representation.pth b/3b_layer8_self_attn.k_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..6c2fc4e19f81052418c9bc5938b8366072371d67 --- /dev/null +++ b/3b_layer8_self_attn.k_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3683bb4a9b8e59cbcf1016bcd05939cac9f57fdc6807fb8b739b26d63749f927 +size 33349206 diff --git a/3b_layer8_self_attn.o_proj_output_pretrain_representation.pth b/3b_layer8_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5e1278492967ab3ae53cc91722957e29668fa5a3 --- /dev/null +++ b/3b_layer8_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab8c73913801e6f8aab86667d6794b387423080a2d9ce6825370fb689e1ee4f1 +size 133391958 diff --git a/3b_layer9_mlp.down_proj_input_pretrain_representation.pth b/3b_layer9_mlp.down_proj_input_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4f8679fd77c62a5430db6435fa84655f8fa9f39e --- /dev/null +++ b/3b_layer9_mlp.down_proj_input_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5171d487497ce7a3762cf747169c3ccf527dd7647a26a8098976dd8a95b467f +size 533562882 diff --git a/3b_layer9_self_attn.o_proj_output_pretrain_representation.pth b/3b_layer9_self_attn.o_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..185933118f858442fdd9bccac511ee4db8ff906b --- /dev/null +++ b/3b_layer9_self_attn.o_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a281bd5545ba618fca63c5d629d483b21046b10476f26bdfdf912ce35e43d613 +size 133391958 diff --git a/3b_layer9_self_attn.q_proj_output_pretrain_representation.pth b/3b_layer9_self_attn.q_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..212847ecb2ef69dc77fd42b8c4f3fafabd047348 --- /dev/null +++ b/3b_layer9_self_attn.q_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e903248f3fb906085bd8dcb95e9a5f19db6ddfa85748730e934f500dc83e94b +size 133391958 diff --git a/3b_layer9_self_attn.v_proj_output_pretrain_representation.pth b/3b_layer9_self_attn.v_proj_output_pretrain_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f2e1d044836761410c3bfddf8cc5ad6bde9f5826 --- /dev/null +++ b/3b_layer9_self_attn.v_proj_output_pretrain_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a7ff79ab1b5c5ecb67babacffaa5af2b1cd329c22587524d7948df69c373f31 +size 33349206