diff --git a/README.md b/README.md index 91bc16b0ff99fd514579aed17e0d786192e372db..97db863362d66284aff2c2bbd2c9b8baf27edba8 100644 --- a/README.md +++ b/README.md @@ -11,9 +11,9 @@ tags: Self-contained browser BitNet export for the AgentKernel Lite chat model. -- Source bundle: `/data/agentkernel/artifacts/agentkernel_lite_encdec/chatfirst_retrieval_special_compact_100m_from16000_train_17000` -- Parameters before BitNet packing: `110885888` -- Final eval loss: `1.6545211980098127` +- Source bundle: `/data/agentkernel/artifacts/agentkernel_lite_encdec/decoder_repair_respond_clean_from_freezeemb_retrieval2000_train_01500` +- Parameters before BitNet packing: `113507328` +- Final eval loss: `0.9985759307940801` - Browser entrypoint: `manifest.json` - Runtime: Model Stack browser BitNet WebGPU encoder-decoder with packed BitNet WASM fallback - Tokenizer: AgentKernel byte-level BPE attached under `tokenizer/` @@ -21,7 +21,7 @@ Self-contained browser BitNet export for the AgentKernel Lite chat model. Web app route after uploading this directory to Hugging Face: ```text -?modelStackManifest=https://huggingface.co/PeytonT/agentkernel-lite-100m-bitnet/resolve/main/manifest.json +?modelStackManifest=https://huggingface.co///resolve/main/manifest.json ``` Serving notes: WebGPU is used when available; Safari or other no-WebGPU browsers use the packed BitNet WASM fallback. Large model files are fetched by the browser and cached by the app. diff --git a/agentkernel_lite_browser_bitnet_export.json b/agentkernel_lite_browser_bitnet_export.json index abab03bdd40888459f1add2c5f71db6a1fd0492c..20ab930dfc1ceaaebd3f28cbb8b12a7b456576a3 100644 --- a/agentkernel_lite_browser_bitnet_export.json +++ b/agentkernel_lite_browser_bitnet_export.json @@ -1,10 +1,10 @@ { "artifact_kind": "agentkernel_lite_browser_bitnet_export", - "dense_tensor_count": 42, - "device": "cpu", + "dense_tensor_count": 43, + "device": "cuda:1", "format": "model-stack-browser-bitnet", "layer_count": 109, - "manifest_path": "/data/agentkernel/artifacts/agentkernel_lite_encdec/chatfirst_retrieval_special_compact_100m_from16000_train_17000/browser_bitnet/manifest.json", + "manifest_path": "/data/agentkernel/artifacts/agentkernel_lite_encdec/decoder_repair_respond_clean_from_freezeemb_retrieval2000_train_01500/browser_bitnet/manifest.json", "max_seq_len": 1024, "model": { "activation": "silu", @@ -14,6 +14,7 @@ "d_ff": 2048, "d_model": 640, "dtype": "bfloat16", + "encoder_position_embeddings": true, "head_dim": null, "kv_cache_paged": true, "masking": "build_causal_mask", @@ -38,7 +39,7 @@ "version": 1, "vocab_size": 8207 }, - "output_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/chatfirst_retrieval_special_compact_100m_from16000_train_17000/browser_bitnet", + "output_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/decoder_repair_respond_clean_from_freezeemb_retrieval2000_train_01500/browser_bitnet", "quantization": { "activation_quant": "none", "modules": [ @@ -157,10 +158,10 @@ "spin": false, "weight_opt": "none" }, - "size_bytes": 69709811, - "source_bundle_manifest_path": "/data/agentkernel/artifacts/agentkernel_lite_encdec/chatfirst_retrieval_special_compact_100m_from16000_train_17000/agentkernel_lite_encdec_manifest.json", - "source_model_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/chatfirst_retrieval_special_compact_100m_from16000_train_17000/model", - "source_tokenizer_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/chatfirst_retrieval_special_compact_100m_from16000_train_17000/tokenizer", + "size_bytes": 80235516, + "source_bundle_manifest_path": "/data/agentkernel/artifacts/agentkernel_lite_encdec/decoder_repair_respond_clean_from_freezeemb_retrieval2000_train_01500/agentkernel_lite_encdec_manifest.json", + "source_model_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/decoder_repair_respond_clean_from_freezeemb_retrieval2000_train_01500/model", + "source_tokenizer_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/decoder_repair_respond_clean_from_freezeemb_retrieval2000_train_01500/tokenizer", "tokenizer": { "bos_token_id": 1, "config_path": "tokenizer/tokenizer_config.json", diff --git a/dense/dec_embed_weight.f32.bin b/dense/dec_embed_weight.f32.bin index 62b9f2f16ae2600c3c59b18655e005d9e268e936..989775d5f09ae65c31ccc4acfb36659942d63541 100644 --- a/dense/dec_embed_weight.f32.bin +++ b/dense/dec_embed_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4f4e6de1db97417c8e97c5e715dd064b5c33c9e94702ac758166c94c5cef61da +oid sha256:78c2a80005b8926af3752edc2ab4c56399688951a282a6b85bf9edbf917fe6df size 21009920 diff --git a/dense/dec_norm_bias.f32.bin b/dense/dec_norm_bias.f32.bin index bea97b3d9b09f474e70b0e909bb475ac26705682..e5f59ec891e3b5b2de2de42be6be6638a97fade1 100644 --- a/dense/dec_norm_bias.f32.bin +++ b/dense/dec_norm_bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5a504281bfbf8814d71a0347d2f1b29da2384360eaa32e344ff7056e112b4001 +oid sha256:a52ba99331e084971ab8824584f8d5e7b308f7f6d5856c6732f8ca9e93e28cf6 size 2560 diff --git a/dense/dec_norm_weight.f32.bin b/dense/dec_norm_weight.f32.bin index 13a2b67b075e99ba8c0cc4ddf8d22bb5c7dfe282..8210cca7c9278d91a9eaa89ae451ea93d2116081 100644 --- a/dense/dec_norm_weight.f32.bin +++ b/dense/dec_norm_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:39fa6364f4ec83f1fee8ad937aee196331d07d86c987e3c4aaea1d78001cb562 +oid sha256:88a7e373f37f1a051e48de5aab9429ae16992571a5ee4536db1babd73dfe3e69 size 2560 diff --git a/dense/decoder_0_cross_block_n1_weight.f32.bin b/dense/decoder_0_cross_block_n1_weight.f32.bin index 7214301e80bd2c0d8b5604a708f4d80c31550acc..52a361c41424f056f3441059d4956b3a3e6e41b5 100644 --- a/dense/decoder_0_cross_block_n1_weight.f32.bin +++ b/dense/decoder_0_cross_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eb1544f5768be6328f6561e7149399a50d6f25a523d6c9b18eb44e92546fc5c1 +oid sha256:e9c937f04235c2be29c729ccb28cdfb4e3bca8356921b61a022e0607831129be size 2560 diff --git a/dense/decoder_0_cross_block_n2_weight.f32.bin b/dense/decoder_0_cross_block_n2_weight.f32.bin index 366208b9a49a65c35748d523ee196fd41b053190..fbf0904be2bb70ea279728642661087afbe3b452 100644 --- a/dense/decoder_0_cross_block_n2_weight.f32.bin +++ b/dense/decoder_0_cross_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:076f5ecc86169fc36943250486b0081df382202af90259ffee7072fd74123fcf +oid sha256:78579439b641dd9fdd660faa7775d54b5e3b73274a8ffdbd7c627711063d1d9b size 2560 diff --git a/dense/decoder_0_self_attn_block_n1_weight.f32.bin b/dense/decoder_0_self_attn_block_n1_weight.f32.bin index 4f504b9e229f617af2b07b2a67ddd67684fa3f47..2ecfbb55ac9deaf6026efdabb5725cb0ebbc2d7d 100644 --- a/dense/decoder_0_self_attn_block_n1_weight.f32.bin +++ b/dense/decoder_0_self_attn_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fdcf9066e761f2f195c430f007594e21aa66f1234c0b85328040f9e7e554dad3 +oid sha256:c2e362ce5f59f6f6086843ed701ad3d3dfaec44f641da7a2be9fd16e0be21c62 size 2560 diff --git a/dense/decoder_0_self_attn_block_n2_weight.f32.bin b/dense/decoder_0_self_attn_block_n2_weight.f32.bin index 61036a5c7892d3cacd740b9879ceb7e6a30dec68..2ef3902fd80875584043b3093e77d53de2e4204d 100644 --- a/dense/decoder_0_self_attn_block_n2_weight.f32.bin +++ b/dense/decoder_0_self_attn_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6e74eda63198e8b627cb92dbf9ccacca9f96deac1a7d2c476d4b6cdbb9dd35cc +oid sha256:ec08bf70a433d42cd2eb3a285a8612deead826ed83e7e4f35a39cd7ce353f041 size 2560 diff --git a/dense/decoder_1_cross_block_n1_weight.f32.bin b/dense/decoder_1_cross_block_n1_weight.f32.bin index 5bffc7cec3f9f06b0ee5c3227ef5f75c364cbaf1..72eb31df4358e872e4a7ae12896194f29db89522 100644 --- a/dense/decoder_1_cross_block_n1_weight.f32.bin +++ b/dense/decoder_1_cross_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e5ca042ac675538a09d1f203f5612ddb70ce142851f2a7230072bcda2f90e4ee +oid sha256:5ec1779722dc0fda7f204111f658f2977944f145389cb41b4dd7e43bc8eb3293 size 2560 diff --git a/dense/decoder_1_cross_block_n2_weight.f32.bin b/dense/decoder_1_cross_block_n2_weight.f32.bin index 8107a485b3d88ebc83e18f91412ee64203bdf28e..6901e4e722a90b429e8391280f3e36f2367c75b0 100644 --- a/dense/decoder_1_cross_block_n2_weight.f32.bin +++ b/dense/decoder_1_cross_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:17201b47c33c425b4e205726a1dd0160224d21a7816a27b3cb2482936373dde7 +oid sha256:e63f46aee081e5e0c9d914cf5a63990a7f8cdf18d69d1c9e3bfd5dac3f529414 size 2560 diff --git a/dense/decoder_1_self_attn_block_n1_weight.f32.bin b/dense/decoder_1_self_attn_block_n1_weight.f32.bin index 5e5630e58e616d221bf942c3651970810667d849..c65c7fc097eabc40fd07284f2bbf01a3df5586a8 100644 --- a/dense/decoder_1_self_attn_block_n1_weight.f32.bin +++ b/dense/decoder_1_self_attn_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:91b80f1512d95b8b638e62d76ca66106598d2a41de988d6f8403bb16bf8fc4b5 +oid sha256:bf626ce4b9540732ae4b0e41e6ecf8df9d37aef2c0f7835fe82da74e8f8350a9 size 2560 diff --git a/dense/decoder_1_self_attn_block_n2_weight.f32.bin b/dense/decoder_1_self_attn_block_n2_weight.f32.bin index a9a23860107398aa3e27dfd56781a83d81c5deeb..b1b9637d71bd8ec50371e03dfcba45bfa1da2819 100644 --- a/dense/decoder_1_self_attn_block_n2_weight.f32.bin +++ b/dense/decoder_1_self_attn_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0d7f5387a2d28ad4f6e0ee3b902c0e0ebb6ece2960c479f6591f1cfeccd1bb3c +oid sha256:19644a427ac6450eac03f470c361290f3d1045900726fcea28a9973373b5c76a size 2560 diff --git a/dense/decoder_2_cross_block_n1_weight.f32.bin b/dense/decoder_2_cross_block_n1_weight.f32.bin index 52bf250df3b0b6bfb11a2f00caa202f8a37505a1..fd62dd85bfb90d68087d927065d3ca9968f7df47 100644 --- a/dense/decoder_2_cross_block_n1_weight.f32.bin +++ b/dense/decoder_2_cross_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6cf4842fcdc048c1a9115fb862bf401bf0504315cfd8afd393ee98ec614393b0 +oid sha256:86e9c81d560b6bf1d1ad5b41f54e516e751e97f70c874b0c9adb6fbf61914c3d size 2560 diff --git a/dense/decoder_2_cross_block_n2_weight.f32.bin b/dense/decoder_2_cross_block_n2_weight.f32.bin index 65183d19387b1f4ebb7303a975ab9b245e4db052..9c23f7ce76ca1bf4516187a44ea996e71e0b67d0 100644 --- a/dense/decoder_2_cross_block_n2_weight.f32.bin +++ b/dense/decoder_2_cross_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:803b8acfc59c8244383517cb942b6e521be21bb3066a7de0ed452bbc49312fef +oid sha256:3a71a2d3f2600a26735b357ddd3a4958bd4590964d149155f1c2167089349d9a size 2560 diff --git a/dense/decoder_2_self_attn_block_n1_weight.f32.bin b/dense/decoder_2_self_attn_block_n1_weight.f32.bin index 319d102a98f3527a147be4c53086c496ca3a3a42..86a3a8c71c5ce60d1b473d2ef377e031b6561237 100644 --- a/dense/decoder_2_self_attn_block_n1_weight.f32.bin +++ b/dense/decoder_2_self_attn_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ba167f943b727d733c4460cbd347a4e7a2e7465d6dbd94d2bfc011935a1a9bb9 +oid sha256:3ac4f3b079f383cc503850ddc0a18679c166364488cd12cf5521d9e1c5baaf34 size 2560 diff --git a/dense/decoder_2_self_attn_block_n2_weight.f32.bin b/dense/decoder_2_self_attn_block_n2_weight.f32.bin index 250584fbd53808b2fb0c42353bfe15bdae5f03ba..fd31cf1f40e8d5c584001ce64a6137fbd5be2ea0 100644 --- a/dense/decoder_2_self_attn_block_n2_weight.f32.bin +++ b/dense/decoder_2_self_attn_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:31d621d52ff0754ff33599bf8d85762a7458dca818ddce1c93310648f2b2a5d2 +oid sha256:8ef13c495f661d19e234362142100d58912a517f4d290dab698282de1821ab91 size 2560 diff --git a/dense/decoder_3_cross_block_n1_weight.f32.bin b/dense/decoder_3_cross_block_n1_weight.f32.bin index 085d6af35b609357680b41edc8930da54fe00d88..94ea36636c11069c5651df380499cb39fa198eb2 100644 --- a/dense/decoder_3_cross_block_n1_weight.f32.bin +++ b/dense/decoder_3_cross_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:40264c9a18a77c788d5230f95c0de43f008b8f846a0be466a875f260b2b5b057 +oid sha256:9ae1fc97c13441dddbbb3e9eb5d47198a3d607c88ec4e43c93d2c81bde27b4d2 size 2560 diff --git a/dense/decoder_3_cross_block_n2_weight.f32.bin b/dense/decoder_3_cross_block_n2_weight.f32.bin index 9afc510345dd61314c009916bd783a0b2a1fd665..2fe8a8a1b1f37c3ef0beef03bd9cf116a5fcca94 100644 --- a/dense/decoder_3_cross_block_n2_weight.f32.bin +++ b/dense/decoder_3_cross_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:091cf7ee073bd6638db219adb03f4295ab68be5d7721a4a7135ab647a3d17b20 +oid sha256:429c331c002c12043871fbf215b416f2db8a1d5f79ce9431a6a907ba17eca8e5 size 2560 diff --git a/dense/decoder_3_self_attn_block_n1_weight.f32.bin b/dense/decoder_3_self_attn_block_n1_weight.f32.bin index c4ee1bf46a73d4416c3130be3ce72fdd9c83432f..4f8e697b3f127bda7c06edb7fed5d98533912c16 100644 --- a/dense/decoder_3_self_attn_block_n1_weight.f32.bin +++ b/dense/decoder_3_self_attn_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2d5aed83057285fead1f0ad341fd4e45739d408df90af9b948e00d6cf672ff3a +oid sha256:4ff58a140da536f85cb1e90acc5235cd45559ae129fd770960044e4c630fdfb9 size 2560 diff --git a/dense/decoder_3_self_attn_block_n2_weight.f32.bin b/dense/decoder_3_self_attn_block_n2_weight.f32.bin index a54a1fa63a33497a208837eaa0651c96cc738481..534f5a6a9ce5b7ae00002b420e7ddb5f3a27a122 100644 --- a/dense/decoder_3_self_attn_block_n2_weight.f32.bin +++ b/dense/decoder_3_self_attn_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:addf0c1c46f80b69327ed9ba9d291fc0ac3f8f46b1d32430a0550fcfbb9bdf81 +oid sha256:de3959c7d087a5d74e7cf13df2097222754acff9efb0d2f661578d10ddd176a5 size 2560 diff --git a/dense/decoder_4_cross_block_n1_weight.f32.bin b/dense/decoder_4_cross_block_n1_weight.f32.bin index fa262da087f8b7c7dce67a21a6b512f28239d1ce..67576d07529913d093a75bdee53dbef26404c949 100644 --- a/dense/decoder_4_cross_block_n1_weight.f32.bin +++ b/dense/decoder_4_cross_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:622fd2c7811caafb6ec4b6672cdb77d6b1a2677a86156c8787c7e076af8ad2b6 +oid sha256:b009766fbf166bc3f7a0dacd2d9a161fc04e586c117a836ce0ebd9fa1ca3ec6f size 2560 diff --git a/dense/decoder_4_cross_block_n2_weight.f32.bin b/dense/decoder_4_cross_block_n2_weight.f32.bin index 28bab6acdc474a65333085e13a980801a0020601..ea2d17320a804c5430d857aa5e262f954761b70d 100644 --- a/dense/decoder_4_cross_block_n2_weight.f32.bin +++ b/dense/decoder_4_cross_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:df5cba19f68c1688c76c00ae547fd4417319068557d1ffd631fd306c774c735f +oid sha256:d40db0671193777c76f5cb7dbdf13f7545a871771b35b770dadd31ec7e825b7c size 2560 diff --git a/dense/decoder_4_self_attn_block_n1_weight.f32.bin b/dense/decoder_4_self_attn_block_n1_weight.f32.bin index 9d2fe5dca25339b7ab0277e6644d856983140eb4..b453b1aa33d64499690ae8a4316c6c43c3ddb815 100644 --- a/dense/decoder_4_self_attn_block_n1_weight.f32.bin +++ b/dense/decoder_4_self_attn_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:36f463ae849c04e510290002b2baf5b6852b7f388e8e75ee98365ad3d8a12764 +oid sha256:74d5d626c5d30fbcb004d3b9cccdcb680d0dceac061d3c9ad3e3367a478daeb6 size 2560 diff --git a/dense/decoder_4_self_attn_block_n2_weight.f32.bin b/dense/decoder_4_self_attn_block_n2_weight.f32.bin index e1c3bd7e52134fa127fba20bf4aa8f8e60018991..f65d51f886ea2d41a28c7904bbab528ec4656ebc 100644 --- a/dense/decoder_4_self_attn_block_n2_weight.f32.bin +++ b/dense/decoder_4_self_attn_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2e36fb000644e19c7de577abdef101e67362cec1f4866028d06494320f770617 +oid sha256:ca807c21a8be5611a6f3d26636658cc23b0294f7a5372f3b1a4e3552a31cbdb1 size 2560 diff --git a/dense/decoder_5_cross_block_n1_weight.f32.bin b/dense/decoder_5_cross_block_n1_weight.f32.bin index 6b206a0c968872b7af7109e43e995a4cc8e12e0b..a527202b51d68ed3d828fe8aac5d04b4aa455361 100644 --- a/dense/decoder_5_cross_block_n1_weight.f32.bin +++ b/dense/decoder_5_cross_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:44104d135d3013adbd3b9cfd7245f9c2567d998d3417cd8f5588bcbc34e2996d +oid sha256:0a7029d09d53f7812b45876923a3267f322dc1f873bab81b4099f72c1eb29f46 size 2560 diff --git a/dense/decoder_5_cross_block_n2_weight.f32.bin b/dense/decoder_5_cross_block_n2_weight.f32.bin index 06a51706521e47dc9f288f2c9cf2788c59d71f2a..0c0a30e620ef811cd1c49923d4bcbe5586048d23 100644 --- a/dense/decoder_5_cross_block_n2_weight.f32.bin +++ b/dense/decoder_5_cross_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:46f24a5c1006acec251c6615268e31cea8682feedf76839fb16cde44f4fde5c4 +oid sha256:1539fa69b705976b0158b27c31a421b0103398f5b7d938e1dec79c871eeedfd3 size 2560 diff --git a/dense/decoder_5_self_attn_block_n1_weight.f32.bin b/dense/decoder_5_self_attn_block_n1_weight.f32.bin index adf288d8ea62ecde7cd27befab0344364f6d1a91..0f4161caa9581476b287281ee81161c67636395d 100644 --- a/dense/decoder_5_self_attn_block_n1_weight.f32.bin +++ b/dense/decoder_5_self_attn_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:67b346c953e25cd41b9f5ce533d93e3c3bd5869505b684be203c676d7b7179a9 +oid sha256:5c5c49ebf225953e7a3c584cd779e73c253e11f01ff26749229b9c9b47cc6a41 size 2560 diff --git a/dense/decoder_5_self_attn_block_n2_weight.f32.bin b/dense/decoder_5_self_attn_block_n2_weight.f32.bin index 2302ef939c99227e637c79a8f5b4eee5467316bd..c9f902d93af5f77922434b22b6087251dc5fc70f 100644 --- a/dense/decoder_5_self_attn_block_n2_weight.f32.bin +++ b/dense/decoder_5_self_attn_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:451996b77d575d3d1d40c5e1e9d96c24448c93d039999b91d132b7d4b37a001c +oid sha256:7ab9b449fdbfc619624903516d79e6f920b50c2ceb15d14078c3782b0a4f3f49 size 2560 diff --git a/dense/enc_embed_weight.f32.bin b/dense/enc_embed_weight.f32.bin index 62b9f2f16ae2600c3c59b18655e005d9e268e936..989775d5f09ae65c31ccc4acfb36659942d63541 100644 --- a/dense/enc_embed_weight.f32.bin +++ b/dense/enc_embed_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4f4e6de1db97417c8e97c5e715dd064b5c33c9e94702ac758166c94c5cef61da +oid sha256:78c2a80005b8926af3752edc2ab4c56399688951a282a6b85bf9edbf917fe6df size 21009920 diff --git a/dense/enc_norm_bias.f32.bin b/dense/enc_norm_bias.f32.bin index 514a250e68ba0446b02f30878459c476f36eceaf..1174610675f6f6153ef9433e7be3c3cd8a71ae45 100644 --- a/dense/enc_norm_bias.f32.bin +++ b/dense/enc_norm_bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3137fc19f4ff925c8811da6be650c38698d307578e74cf3757fd3607a0be0c29 +oid sha256:73c7b6e76072acad2244afc73657d29377fd189a8af9bc41daa14aabb346606a size 2560 diff --git a/dense/enc_norm_weight.f32.bin b/dense/enc_norm_weight.f32.bin index 2b94fdccb5118766801d7a46d4d1a10c37c84949..cc9c7179c558281858559d09d4a2d2ac85bf1aa1 100644 --- a/dense/enc_norm_weight.f32.bin +++ b/dense/enc_norm_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d08173a24ed7c4e20a10a518254f215886e33efcf83e185160a4c033cf84ad4c +oid sha256:fbce78fa3910cca15c0bec29f929009612f7f5b94d1d083771ed0b114bb2a337 size 2560 diff --git a/dense/enc_pos_embed_weight.f32.bin b/dense/enc_pos_embed_weight.f32.bin new file mode 100644 index 0000000000000000000000000000000000000000..570e24ddcd3c1749e30d118291338c6af4e5efc2 --- /dev/null +++ b/dense/enc_pos_embed_weight.f32.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41e06124cce8055432e8e6a7a9a9a2a6e39ac672071f23dea5872bd19c51e4d9 +size 10485760 diff --git a/dense/encoder_0_n1_weight.f32.bin b/dense/encoder_0_n1_weight.f32.bin index 48ec54b96329b973a3ca7ad430babdb0df291dfa..bfe3df8fa1f30c6b817595e1e2c167b5477c082e 100644 --- a/dense/encoder_0_n1_weight.f32.bin +++ b/dense/encoder_0_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9dd433b1403ac0fe16541c304a42d3e67b0b2cb32b47e872ed0be569596e6e66 +oid sha256:146bdd3c5419ea957cba0919904c3fa3a18345399e1190e38b1697c5bc56a18e size 2560 diff --git a/dense/encoder_0_n2_weight.f32.bin b/dense/encoder_0_n2_weight.f32.bin index 073555d4fe4542b21e7855af79b5c9e10dba5382..d9827eda87b4e8974da478bc04cbc15bf8bf86a8 100644 --- a/dense/encoder_0_n2_weight.f32.bin +++ b/dense/encoder_0_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9d33d04a66bcce116bbd0bc6072b494a5f68c3e77f69f0549326f66a75c68b5e +oid sha256:2817160dc2b42d5f8de29fb566ed4165dff109f084f8a5af1766e544a7fea509 size 2560 diff --git a/dense/encoder_1_n1_weight.f32.bin b/dense/encoder_1_n1_weight.f32.bin index af5ba88deb07c6edcfe67069294c02edc26a505d..56cf81d4203ff908433209e35729a3f93771d91d 100644 --- a/dense/encoder_1_n1_weight.f32.bin +++ b/dense/encoder_1_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:177e15460da20c7b1452c39daed8b193781de5a7723a82eac4b9089897447a18 +oid sha256:4b3b5cbb90b337e7c217bfe73872429a99ef7aaeda0743a01e7c78b496abce08 size 2560 diff --git a/dense/encoder_1_n2_weight.f32.bin b/dense/encoder_1_n2_weight.f32.bin index eb1725d52eec74bc04b8da06084d7393ebdff4d8..c0eb4495f190f58ba91204c285fad3c458076032 100644 --- a/dense/encoder_1_n2_weight.f32.bin +++ b/dense/encoder_1_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:99cc691f53f600e90d3f636f673359af993b1f2f2ce259f7dcb61d6d1647fbab +oid sha256:2030393e0c8cc4554a10187e03f03e541a380227d3b64c3f6455aa23d8295be6 size 2560 diff --git a/dense/encoder_2_n1_weight.f32.bin b/dense/encoder_2_n1_weight.f32.bin index 754c84479ea7c6ae84860fead8e9c865819b5202..0eda91b2903b1d9f1fc84ed7915f043d16dc51c1 100644 --- a/dense/encoder_2_n1_weight.f32.bin +++ b/dense/encoder_2_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:84cea3917081531f374901364d9a36691227083d011ac1364e01c8b1866b2ac2 +oid sha256:203d16e2f34a9fb6059e24d8bde0b3d2e85e8edbeaecb2eac7c647b9c81f1dde size 2560 diff --git a/dense/encoder_2_n2_weight.f32.bin b/dense/encoder_2_n2_weight.f32.bin index c2d00b0a273b658ccf879a49ac5cd549677d7eaf..908ff35f29dd10ebdc88b85e2726195662c765ea 100644 --- a/dense/encoder_2_n2_weight.f32.bin +++ b/dense/encoder_2_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5f14762332dbb644ff274586a0ba82af4be2c4cdc469d31e166d488044c9dd35 +oid sha256:a223438f7de8e65465b9c95605748e0152bc1b92d77b72d3af2a41d9ff108927 size 2560 diff --git a/dense/encoder_3_n1_weight.f32.bin b/dense/encoder_3_n1_weight.f32.bin index 18b49ba81ac4a9172c029e56da411f7c6e065cb2..b85d1397db1b0f983c31c817a3266aa85991e722 100644 --- a/dense/encoder_3_n1_weight.f32.bin +++ b/dense/encoder_3_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1abb733c2331d9145ca33290b207dbbc6dc15053f56aaef9b659df4662b0eb41 +oid sha256:6f97f7dc429e26a0e2950787e5ec7c9fa3c3ab9b8ddd0fc1279c19908fdb9868 size 2560 diff --git a/dense/encoder_3_n2_weight.f32.bin b/dense/encoder_3_n2_weight.f32.bin index b296e33ea5074440ff27de59f3f3248638676923..93b047e41e67d50a7a06051f71b2229c46fadad0 100644 --- a/dense/encoder_3_n2_weight.f32.bin +++ b/dense/encoder_3_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4c7407197d1d85e0693f4056925b029929bc471f659557c9a39f0383f6cd3266 +oid sha256:9754f40fc928fdca4359684c41888d1b3d6af817936af59b161f3824b32534ff size 2560 diff --git a/dense/encoder_4_n1_weight.f32.bin b/dense/encoder_4_n1_weight.f32.bin index 9e9ff6de7f25a62fc45235bdace87c6e4ba9f64f..6767761c92eb82f978cd16220ae11176113c7b1c 100644 --- a/dense/encoder_4_n1_weight.f32.bin +++ b/dense/encoder_4_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eb44b4546a957ecc9b8f8c70b985fdd04cf7b634d3b1ebd4aef456387beb683e +oid sha256:2195f562646510d2e377c5d219dc1341d32001ed30b4d54cf754462cbcd175a1 size 2560 diff --git a/dense/encoder_4_n2_weight.f32.bin b/dense/encoder_4_n2_weight.f32.bin index 75f9b4df15cb0df79b1e7ef408159774131d1bcf..f8b83df2d8c8b5c37ad0a31a3bbdcd8f05a8cc2b 100644 --- a/dense/encoder_4_n2_weight.f32.bin +++ b/dense/encoder_4_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7626d463427ded1e6da5602867bd19a5baf2496d49c21878cf392c4acbbaa645 +oid sha256:75fda5bbfe2285970162c18ebf565ebe3e4032b2751b4bac289409a0ed8cb12b size 2560 diff --git a/dense/encoder_5_n1_weight.f32.bin b/dense/encoder_5_n1_weight.f32.bin index 9364ed73c590524581871eb6f520c80eb97f5527..725fa9930f76b9d503537e56a8d5320233437a07 100644 --- a/dense/encoder_5_n1_weight.f32.bin +++ b/dense/encoder_5_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0d756e71405f5928a6ae70ef262b4237a8584a795a60eaa158c1a234d05b2bc2 +oid sha256:eb288cd1ccb8e5b7d5da5e6fa88afd881471b0bbbd355e14adbc3b885385e71f size 2560 diff --git a/dense/encoder_5_n2_weight.f32.bin b/dense/encoder_5_n2_weight.f32.bin index bd694b3a7a5a2ce0952bb4815bd792ea56c0dc14..e8e3b1bff53e8e970c4b3e22b3ba5dff8fa9c777 100644 --- a/dense/encoder_5_n2_weight.f32.bin +++ b/dense/encoder_5_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b7fc6eb738eac62a7880893a3c3f35913ae958f06eb9593942bc2fc63ba1f9d1 +oid sha256:75218ab909794e1396d0a651023851988cfea12c5085c9230b883188d3a66ae1 size 2560 diff --git a/layers/decoder_0_cross_block_cross_w_k.packed_weight.u8.bin b/layers/decoder_0_cross_block_cross_w_k.packed_weight.u8.bin index 727eaa6b72360f53116c538ff103c3f207643883..c9adba5c714961965fbd434afb191cbd929ce561 100644 --- a/layers/decoder_0_cross_block_cross_w_k.packed_weight.u8.bin +++ b/layers/decoder_0_cross_block_cross_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3ec4ae80b24ffa71a637d7223b360d3928124c6487a2b9d714526456828930ae +oid sha256:982b011fe87a1a8b0c2d5b4fcf645a9335e5e7e2e8a48b6983c879835a6aaa1c size 102400 diff --git a/layers/decoder_0_cross_block_cross_w_k.scale_values.f32.bin b/layers/decoder_0_cross_block_cross_w_k.scale_values.f32.bin index 3005463e6c2f13ac5d1f66879cc84c2171013d50..80b99a155e9c5ae819fc27c9b2d965e5733086eb 100644 --- a/layers/decoder_0_cross_block_cross_w_k.scale_values.f32.bin +++ b/layers/decoder_0_cross_block_cross_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9f39d50bf53473b96c7d6b64d06d61e07fc684226defd840191874dea5bc6328 +oid sha256:1cd84c7bf5262b70b638f322e6ea50dd15a935a42c023048e208794f1e6efe8c size 4 diff --git a/layers/decoder_0_cross_block_cross_w_o.packed_weight.u8.bin b/layers/decoder_0_cross_block_cross_w_o.packed_weight.u8.bin index fc138ca1855b032a50f56168ac3ea2a3a0fd9137..d6c220cef723d8d1b5119e3b964ca0ddf4fde7d2 100644 --- a/layers/decoder_0_cross_block_cross_w_o.packed_weight.u8.bin +++ b/layers/decoder_0_cross_block_cross_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e23f5fa340d288f9a9df5e568a7cc5aab98df574c8e6961c2b5e0fc99874c4fe +oid sha256:4c26e3f5b35f3698ba7cf07a90484d2898796924e1486ca1912fbe48eafe2766 size 102400 diff --git a/layers/decoder_0_cross_block_cross_w_o.scale_values.f32.bin b/layers/decoder_0_cross_block_cross_w_o.scale_values.f32.bin index a31994a14ec568d91febefced59258f29835ae81..95f384a3eaafb332b6bb76e83a9cbc93f5004d71 100644 --- a/layers/decoder_0_cross_block_cross_w_o.scale_values.f32.bin +++ b/layers/decoder_0_cross_block_cross_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8298b5baf8f1af425aea4cb4f9587959d4f8c0027ff71e9681d9b99ac5908933 +oid sha256:71212803e1148c154056c46a4bbcbf62bf0924bbafaa98d757aac03cedfd9dd4 size 4 diff --git a/layers/decoder_0_cross_block_cross_w_q.packed_weight.u8.bin b/layers/decoder_0_cross_block_cross_w_q.packed_weight.u8.bin index 804aeafdb12a60209537c4e799619a91faa32ad4..a1b0b6352ad5a40b38d22efb5512f8bab2bc2bc2 100644 --- a/layers/decoder_0_cross_block_cross_w_q.packed_weight.u8.bin +++ b/layers/decoder_0_cross_block_cross_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:827dce8c453eafc2a1a5f73a75a2c6b7146b867b4c1e134609175df6cf4cf101 +oid sha256:97f87a393223a02090729500d41370d7d7d30a269b7710c919abfc48e7c008bf size 102400 diff --git a/layers/decoder_0_cross_block_cross_w_q.scale_values.f32.bin b/layers/decoder_0_cross_block_cross_w_q.scale_values.f32.bin index 98598ed997b8bba5920b710d13a60179370292c5..5d6c6986ac56a5f8aeba84c183ec7bf622485140 100644 --- a/layers/decoder_0_cross_block_cross_w_q.scale_values.f32.bin +++ b/layers/decoder_0_cross_block_cross_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:87ea67f73d751bedaa48a82d1ab55f6824ab8136e2e91b9d610662ca8601e763 +oid sha256:9b6668ebf77529a1006886dfc7dd0a74b54b295645cd3c7454c113143ca5a575 size 4 diff --git a/layers/decoder_0_cross_block_cross_w_v.packed_weight.u8.bin b/layers/decoder_0_cross_block_cross_w_v.packed_weight.u8.bin index d23296743abec4653430ef544ef8f96414fc7d66..722fdd7d2b5311c9ed51f737f7549d6ea1b651db 100644 --- a/layers/decoder_0_cross_block_cross_w_v.packed_weight.u8.bin +++ b/layers/decoder_0_cross_block_cross_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:73817a906cee71e8294c20ddada43956137ea65cb78d2d8eabcf7ac10e060a54 +oid sha256:1d14b3c5a2c23317ca7d3d144bad570d637b047b55b7a815621ab8fc8ec603db size 102400 diff --git a/layers/decoder_0_cross_block_cross_w_v.scale_values.f32.bin b/layers/decoder_0_cross_block_cross_w_v.scale_values.f32.bin index 3b15a1e065e4bb8350c91f626e0352695214059b..3b2a3c20278c45a4060ca1a5c5a3e559d6898b14 100644 --- a/layers/decoder_0_cross_block_cross_w_v.scale_values.f32.bin +++ b/layers/decoder_0_cross_block_cross_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:50c5f27dd38fad44d2d2ea50443fd9a6c50a187cbf389b3983179cc5f64d83bb +oid sha256:e7afbeea361f30dea3b8b0647a08256bea9be60a1016f0efacb3af0316724247 size 4 diff --git a/layers/decoder_0_cross_block_mlp_w_in.bias.f32.bin b/layers/decoder_0_cross_block_mlp_w_in.bias.f32.bin index 314e8c359533f5878f63336e6db9cc36c4011783..3719510bb774569c61a4f9c20a1f71a222c30a07 100644 --- a/layers/decoder_0_cross_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_0_cross_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:00d2055f715b5ebf6759aa67eaa147307789564608619b6af16afe214fadd064 +oid sha256:243bc0ff5ab70374de5611e00f881f5e6ab2e37c01585d7cc91be33710e043e0 size 16384 diff --git a/layers/decoder_0_cross_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_0_cross_block_mlp_w_in.packed_weight.u8.bin index 720f424f96940ce3d98a228cca82b0c6a1e25c6a..697b29c8081fd4b267af6b19e22dd83101d6f63e 100644 --- a/layers/decoder_0_cross_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_0_cross_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b2779b7294d7662e5869dfa1828bbd9ec56a99aa7f79f5242be287385aac92fa +oid sha256:41c4fb217a184ad7c74cccb1850851c1fec8dcf6749702f45c6f886b31434c94 size 655360 diff --git a/layers/decoder_0_cross_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_0_cross_block_mlp_w_in.scale_values.f32.bin index ea617a542f6319ce65d8572478de8b29059e8e0a..df00345f580ac0c4261db7495c8c7259e2b9163c 100644 --- a/layers/decoder_0_cross_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_0_cross_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8dfed15a2583ff098b973bd63595871e32e73b5601fd71c0a063349da4acb38a +oid sha256:eaced36f128bb70455e0eb8d46b835775ac79a7e251254ebd2b0e6ec10378d0a size 4 diff --git a/layers/decoder_0_cross_block_mlp_w_out.bias.f32.bin b/layers/decoder_0_cross_block_mlp_w_out.bias.f32.bin index 7e37bf44c1c95ffeb33351de9791e2701649c5ac..fdc601418db15599e5f6a83ec77b490a11f0b4b8 100644 --- a/layers/decoder_0_cross_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_0_cross_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3e8ff4ab3a6c857f9460c554109293ea056e061373af980590bddd5ee2abd964 +oid sha256:93e5d268cec594d48d9e4dba6f0ffbdec30bf60c8f72614448b97c57e8de9d02 size 2560 diff --git a/layers/decoder_0_cross_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_0_cross_block_mlp_w_out.scale_values.f32.bin index e530eee2f0e5bae4327944b31d62e766e7e87b49..64a5b0785185da3782724d6cd44edae2df9d51bc 100644 --- a/layers/decoder_0_cross_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_0_cross_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d289652991a8a6bbb6306b4ac100899fb2f35c3ad5beb337a41e9163b1979f7c +oid sha256:c33677d40924532339ba17f96c7098ea6198b15280e68ed2ca8625912bd8aa8f size 4 diff --git a/layers/decoder_0_self_attn_block_attn_w_k.packed_weight.u8.bin b/layers/decoder_0_self_attn_block_attn_w_k.packed_weight.u8.bin index 118c386604f5bde16465fc4e37fa0d21f407f0c9..7781270b4e46fe0082e62d0f0cf3cfd2e077de65 100644 --- a/layers/decoder_0_self_attn_block_attn_w_k.packed_weight.u8.bin +++ b/layers/decoder_0_self_attn_block_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cbff1d78a3feeb67fca9095fea92fe40cc282a45776459fe82aa749922f4d620 +oid sha256:fb1445a194065f84f93d6fedd73113035d7beb2314d7cdf77a5731700c05ccde size 102400 diff --git a/layers/decoder_0_self_attn_block_attn_w_k.scale_values.f32.bin b/layers/decoder_0_self_attn_block_attn_w_k.scale_values.f32.bin index 437e55e65822cb7e460d2f8312bf8cbed3aeb0dd..7fed3467e6a260203ddfd3e26cd34ea1d4c5920b 100644 --- a/layers/decoder_0_self_attn_block_attn_w_k.scale_values.f32.bin +++ b/layers/decoder_0_self_attn_block_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3209a3fdf503c3ccdd78d46a0013a46932396b116c08dd33d5458e5b3d8b7d46 +oid sha256:65dc763995a05d919bd32c3ae62429d6ae6e5dc59d7570e9e511e617400d105a size 4 diff --git a/layers/decoder_0_self_attn_block_attn_w_o.packed_weight.u8.bin b/layers/decoder_0_self_attn_block_attn_w_o.packed_weight.u8.bin index 13c6058d9fd382168054911e85edafb7f88ce4ff..b887b52541896b703e42baace30c2c3e841d3797 100644 --- a/layers/decoder_0_self_attn_block_attn_w_o.packed_weight.u8.bin +++ b/layers/decoder_0_self_attn_block_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b81593ee5f78bff319625a598ee3a326e450ccec286f4f054c41716a7a6c44fe +oid sha256:e2f907585a66def6ac95c943ab6364491d9410323d6c2acf1e7d85f583b8cad6 size 102400 diff --git a/layers/decoder_0_self_attn_block_attn_w_o.scale_values.f32.bin b/layers/decoder_0_self_attn_block_attn_w_o.scale_values.f32.bin index ba876affc2cac331aca865479830c2d2adb5402b..2d74fa03e9794018f40cd75c414897a24558d670 100644 --- a/layers/decoder_0_self_attn_block_attn_w_o.scale_values.f32.bin +++ b/layers/decoder_0_self_attn_block_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:62d4c1ea8209bf8ef3c900abf620e9e98250331c70728a08ba701a897f680e97 +oid sha256:7c7233dbf0113e851ea6a854beae2f1c9ccf2871a1cc8798a07d00decccab7cf size 4 diff --git a/layers/decoder_0_self_attn_block_attn_w_q.packed_weight.u8.bin b/layers/decoder_0_self_attn_block_attn_w_q.packed_weight.u8.bin index bebab73b984db04f799d7b5f6d286ea485024f53..97aded00f0ff95c5fa17109c20ad191b6d21607e 100644 --- a/layers/decoder_0_self_attn_block_attn_w_q.packed_weight.u8.bin +++ b/layers/decoder_0_self_attn_block_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:73085bdfeea8e210e3851ad505e3ecb1a77d6dba6a3cb56452de02eaeebec1b1 +oid sha256:e7f4ef6d97be20f7ac273b0280302bf087151da75c4a2bc645ddbc74f340279a size 102400 diff --git a/layers/decoder_0_self_attn_block_attn_w_q.scale_values.f32.bin b/layers/decoder_0_self_attn_block_attn_w_q.scale_values.f32.bin index d515c3d4f4eee5b33abb26017f00d605a6872749..39a9bf01092bdd78c8d42d4b309e10c0e88759b6 100644 --- a/layers/decoder_0_self_attn_block_attn_w_q.scale_values.f32.bin +++ b/layers/decoder_0_self_attn_block_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:35aaf02e17f4cbf3a47587d3b8abceea4bc0716327ad1dac8e610870105bd75d +oid sha256:e1d0d0af2f97073330992aed3e464957c7f31a5196fdd8525637cfdb0970f042 size 4 diff --git a/layers/decoder_0_self_attn_block_attn_w_v.packed_weight.u8.bin b/layers/decoder_0_self_attn_block_attn_w_v.packed_weight.u8.bin index 2707ad3c78513f767fd65d45951203a722c23cef..1277808e7562dd8baa316b5b65a4763db56acc6a 100644 --- a/layers/decoder_0_self_attn_block_attn_w_v.packed_weight.u8.bin +++ b/layers/decoder_0_self_attn_block_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ead4eb1e0d6c62532a7088f16445356b1c1674a11d19e0f2c5b5fe66f18188bc +oid sha256:819396927e490b8c3959c6f006c112eb768d02d74b6b86b7afd8f7b372c1e2e8 size 102400 diff --git a/layers/decoder_0_self_attn_block_attn_w_v.scale_values.f32.bin b/layers/decoder_0_self_attn_block_attn_w_v.scale_values.f32.bin index eeeace89fbb9e3894bc98b013517f0c0fd070e41..ac95877f65bbc1f670725f9f7970c19746e6de73 100644 --- a/layers/decoder_0_self_attn_block_attn_w_v.scale_values.f32.bin +++ b/layers/decoder_0_self_attn_block_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6c9df1445abe44f288e97f6233aab7f6bd2757d75bca91a527dab2c52b25e5cf +oid sha256:258663b01b5d4aae55b2abc15b3e8e87db4a75c52f141f4ea132b1ed11ab0150 size 4 diff --git a/layers/decoder_0_self_attn_block_mlp_w_in.bias.f32.bin b/layers/decoder_0_self_attn_block_mlp_w_in.bias.f32.bin index 0c118e8f899db0f4828d42d61233ebdfadb57136..4dfd12c46dc39a4a9fcbd5f1e9a2a3d6c8afa84d 100644 --- a/layers/decoder_0_self_attn_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_0_self_attn_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6da013727d9557ff5ea212b7d124340fd66cc6ae8324710fc48077d8b77efce7 +oid sha256:738b38445bf3e8a03e758d3c67b687f1349b33ecb802888f642e1c7b46a65d17 size 16384 diff --git a/layers/decoder_0_self_attn_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_0_self_attn_block_mlp_w_in.packed_weight.u8.bin index fa677f992717a8036d27463bd67852a2f49172d6..3f156933f4f09b486f26b2748bd0f31dc380e871 100644 --- a/layers/decoder_0_self_attn_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_0_self_attn_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:481bd133a5c48455630d34e2961c65d13f8aba072205c152dacc131795637e85 +oid sha256:2879daff121daeb59a75ae0cf2b8947e8591f2a94508e838311fee26485c3554 size 655360 diff --git a/layers/decoder_0_self_attn_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_0_self_attn_block_mlp_w_in.scale_values.f32.bin index 2fc448d62e8a5b7e2307b34eead78aa58588de9b..10cda539641399871a2c0da4f0c1fee438fe7a6c 100644 --- a/layers/decoder_0_self_attn_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_0_self_attn_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0d5c9cbece594a01b9fc12756117ac0994c4a329b9bad1a30f2160e9fc42d261 +oid sha256:b68d1acb8653e3e87271faa0828042ef37a00bfa0dcf2228db49017a23b67949 size 4 diff --git a/layers/decoder_0_self_attn_block_mlp_w_out.bias.f32.bin b/layers/decoder_0_self_attn_block_mlp_w_out.bias.f32.bin index 5bb1560028d671b330b94957a1d0ab5331ba93af..7cec65bf6b385d3b1a6b9f6b5ca4ba07f3b161ef 100644 --- a/layers/decoder_0_self_attn_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_0_self_attn_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d48a4623aa0453584d08f60a4c993f6ec7450c22f87d0b41042440a93909d2dd +oid sha256:e057a152b1e3b3bc1f982c0c5ac0c80853a2d0358775f9a74cd2189332b80336 size 2560 diff --git a/layers/decoder_0_self_attn_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_0_self_attn_block_mlp_w_out.scale_values.f32.bin index a06f613c42801fc730cf40f0b082223ffbfbbe3a..5dc44030faed9b8aaa58b18d4a6b23eb36f15f71 100644 --- a/layers/decoder_0_self_attn_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_0_self_attn_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:adac014368b20fd45628680e0d18e4dbb100dba15682564651338ee0619f0a4c +oid sha256:d45c24f580c64ad0f07e0f5af42a50d887322f039d32b0b7b7aa79d85e9c3d7d size 4 diff --git a/layers/decoder_1_cross_block_cross_w_k.packed_weight.u8.bin b/layers/decoder_1_cross_block_cross_w_k.packed_weight.u8.bin index 1c55176f9165c00137b59368bfb6b28e378e445d..256be9a3a252ab1d319f22fb7a781751f834c8f5 100644 --- a/layers/decoder_1_cross_block_cross_w_k.packed_weight.u8.bin +++ b/layers/decoder_1_cross_block_cross_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:577097cdab5aee51810dfebfa3223a3fa586ac82e08e10c817e7bb88823e6dc4 +oid sha256:8f097d5ab440b0ba3008ce087a47bd350198dc277b19a0b82252902b4c6d16cd size 102400 diff --git a/layers/decoder_1_cross_block_cross_w_k.scale_values.f32.bin b/layers/decoder_1_cross_block_cross_w_k.scale_values.f32.bin index 9f62bf7ace711bd5dd070ddcafc2f325206d2f46..3e3c891cd62d8fbd07b205ca8ea4d2db9f585c3e 100644 --- a/layers/decoder_1_cross_block_cross_w_k.scale_values.f32.bin +++ b/layers/decoder_1_cross_block_cross_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:194e3450e17003176706c9ed62806647d70744c5d5aece49e0a1932dbb65252f +oid sha256:6f9f17178c426f37dc84f6ff8c32e58375782addb3e49d98e967be1c9a4a8e6c size 4 diff --git a/layers/decoder_1_cross_block_cross_w_o.packed_weight.u8.bin b/layers/decoder_1_cross_block_cross_w_o.packed_weight.u8.bin index 0e42787826ab3cdb230206c5635e6939e3f74e4b..8c59cc8f220fb7a9029614cb26f711766f7f47a8 100644 --- a/layers/decoder_1_cross_block_cross_w_o.packed_weight.u8.bin +++ b/layers/decoder_1_cross_block_cross_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1647314ef6712e6dd39f2e63744b7431135dc2cceabb571950ee0769cee130b0 +oid sha256:e8466a50a9fc2ca4de15274be6b1c5339c6e0c1a3570289a576c7f4c0047d473 size 102400 diff --git a/layers/decoder_1_cross_block_cross_w_o.scale_values.f32.bin b/layers/decoder_1_cross_block_cross_w_o.scale_values.f32.bin index 6ddc7c02edbb5b6efee70f232018d3c2ed3f97fd..8618cac0841231748c45f6306bc57fd0187433cd 100644 --- a/layers/decoder_1_cross_block_cross_w_o.scale_values.f32.bin +++ b/layers/decoder_1_cross_block_cross_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:57ddc9a933fecf788a1f0dd300a50b455b3698333e3e85b63332f05b9733aa95 +oid sha256:12c229bea058156dee5ebab47b585922cf4969e8cd9f86181894cf04514b2f4b size 4 diff --git a/layers/decoder_1_cross_block_cross_w_q.packed_weight.u8.bin b/layers/decoder_1_cross_block_cross_w_q.packed_weight.u8.bin index 0840b97c0f2bbd427a5bdc96ff0cf859a69ea754..4e153478a2d2c8725c653d104ece92eea5711280 100644 --- a/layers/decoder_1_cross_block_cross_w_q.packed_weight.u8.bin +++ b/layers/decoder_1_cross_block_cross_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c76b3bab12b71b791c49f31aa6822de42d602be8c2bf08d50435ec40616d3135 +oid sha256:2a17cca01d8239ae17510fc30457db79478b8cdc21c4b87664d82d542a68d00c size 102400 diff --git a/layers/decoder_1_cross_block_cross_w_q.scale_values.f32.bin b/layers/decoder_1_cross_block_cross_w_q.scale_values.f32.bin index 8262faf0ef0dad8c553203318c4889b1d7ad46ca..6d0fc5d5b2e1ef77291199196cd5b01179703b5d 100644 --- a/layers/decoder_1_cross_block_cross_w_q.scale_values.f32.bin +++ b/layers/decoder_1_cross_block_cross_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:137fa14f376bcba4bd21d5e2041af7e66bcef81930584cb571482bdd9fddc088 +oid sha256:b28cbb207d7fd7186365278550c51df45cffb220560a46ee104e47df984ae3c0 size 4 diff --git a/layers/decoder_1_cross_block_cross_w_v.packed_weight.u8.bin b/layers/decoder_1_cross_block_cross_w_v.packed_weight.u8.bin index afe1a643aea48eab08c40ca640201ebc030d78db..d3e14a2230a3ce55cb9130068c7a380ce5cfb264 100644 --- a/layers/decoder_1_cross_block_cross_w_v.packed_weight.u8.bin +++ b/layers/decoder_1_cross_block_cross_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b409802e35ff1ea6ed39862aff9c220ca09e151a418b8cc3d528d12d70094592 +oid sha256:471b4a37f66a8b5583d41e02415a96aedd833d2b0b47bdec1aa8e897b2f32c78 size 102400 diff --git a/layers/decoder_1_cross_block_cross_w_v.scale_values.f32.bin b/layers/decoder_1_cross_block_cross_w_v.scale_values.f32.bin index 332b4a0bfa763d751c038332d229036efd856ac5..cdf4ae8651c39d73847765d442bc49388fc2e863 100644 --- a/layers/decoder_1_cross_block_cross_w_v.scale_values.f32.bin +++ b/layers/decoder_1_cross_block_cross_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4f3a918598b8fd86ea2a2e2f55ab20ab0e72a2892c37e58bd7da0fcf41b6053b +oid sha256:05a4de10024706188b2d5a60c71bf4e46da2d0a07a6d4703476f56829484beb0 size 4 diff --git a/layers/decoder_1_cross_block_mlp_w_in.bias.f32.bin b/layers/decoder_1_cross_block_mlp_w_in.bias.f32.bin index b8393da7fe08bdf8580ae656cc1675a53bed542f..49147a11cdd4ae19991356a99adb4e68c957ee15 100644 --- a/layers/decoder_1_cross_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_1_cross_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e6525df753e51d34970abaf8d1c40a74b796720c1db712b744e7388fef61e8d7 +oid sha256:907a4a6d6fdb011b6dd5d94b2348e9e192bd9da2dec954ff781d0a1bef671b73 size 16384 diff --git a/layers/decoder_1_cross_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_1_cross_block_mlp_w_in.packed_weight.u8.bin index 7f69120935cb188d625f88db7ed9011cd652ccbd..f91797d84a4c6fccdb16a477d6bb1b7d321ab727 100644 --- a/layers/decoder_1_cross_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_1_cross_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:03f29751328c92fab31ad224f385b4be3af4d66bb7bbedc46123ada15d895825 +oid sha256:94ae5ae2753c38bf39ec63d701e65936a38bf557c6fe84fe8dff364884040e4d size 655360 diff --git a/layers/decoder_1_cross_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_1_cross_block_mlp_w_in.scale_values.f32.bin index 461734afd373d35607a493b5d8fc89c7d6ea3f4a..a5c99a04d3aac10f94b3b42b9ded2444a4c2e218 100644 --- a/layers/decoder_1_cross_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_1_cross_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0168260e9d02616ac57d771b85b06f96d3c8ca0b1801b4d8f422d715f32267ec +oid sha256:30d23be49820704681a3c9e803812639359b86604eb64e30a85bb2db26f71580 size 4 diff --git a/layers/decoder_1_cross_block_mlp_w_out.bias.f32.bin b/layers/decoder_1_cross_block_mlp_w_out.bias.f32.bin index d19f598fb2a2e1741cc2d7c73712d7f24357a280..a11069119aca721e45fe2e626250b48ce7305a77 100644 --- a/layers/decoder_1_cross_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_1_cross_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:779ad3d61df709063c357c15661555fb95c87cec16cdc5e9d9a4be9e4ec5cce4 +oid sha256:b2d3870652a5e125759e95b9f86733e0bc5f77d3f6a5cc411bcaa3fa566f3f0c size 2560 diff --git a/layers/decoder_1_cross_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_1_cross_block_mlp_w_out.packed_weight.u8.bin index 87e5ee8fcfa292a2e038b6847a75e2d210833a96..4100a2a4c40c0f97ebd598f9aa3e4bb317fee70c 100644 --- a/layers/decoder_1_cross_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_1_cross_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d4a9f2dfebe2c7cc447debb622c90c0cb36b63148a2634d34e0d6fbdd0112e3d +oid sha256:a83bfd0b689cf348764bc0360cf4408087f5fd10d81d8ba0df42986478fbfd59 size 327680 diff --git a/layers/decoder_1_cross_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_1_cross_block_mlp_w_out.scale_values.f32.bin index 3f3944a7f407b3903dd079ecd1b84310665769fe..f7669aa9a09b9c99e6dd9bc5f367cfb0b9c36af9 100644 --- a/layers/decoder_1_cross_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_1_cross_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1927215e4fa03d29dce248987860d1bfd75b9564af190b51e15e766bfab1d921 +oid sha256:16271011077b123cf1c809483461077673a1b0ea531b4b1c7e3279a9ecbeaa4e size 4 diff --git a/layers/decoder_1_self_attn_block_attn_w_k.packed_weight.u8.bin b/layers/decoder_1_self_attn_block_attn_w_k.packed_weight.u8.bin index 5054b0453efae8bad0191e5f716b12cf348496f4..cb6528edca42617744d5a5345c54f399d524dffd 100644 --- a/layers/decoder_1_self_attn_block_attn_w_k.packed_weight.u8.bin +++ b/layers/decoder_1_self_attn_block_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:48a1d4bb988a8c29875b8ab2d6c68b35b3d85ab70805536da149816d2d905533 +oid sha256:3c208fda9770ebca77af78e09a330a1fa8c11e9be00f68661e966a68a0ccd48b size 102400 diff --git a/layers/decoder_1_self_attn_block_attn_w_k.scale_values.f32.bin b/layers/decoder_1_self_attn_block_attn_w_k.scale_values.f32.bin index 9772640b010c0c0849f144641e64a04bc1e037b4..05835a27c3954002ffcad03b6c634418b863ce17 100644 --- a/layers/decoder_1_self_attn_block_attn_w_k.scale_values.f32.bin +++ b/layers/decoder_1_self_attn_block_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:748fcc632ef97bc835054dad79fdd28617c717337ad6634c8739aa30ff8f9735 +oid sha256:858f9e7559d0bb7fa3898567404a3201cda67a783485e1a3396fdf3e3b795553 size 4 diff --git a/layers/decoder_1_self_attn_block_attn_w_o.packed_weight.u8.bin b/layers/decoder_1_self_attn_block_attn_w_o.packed_weight.u8.bin index c3c6b35dec3de4a89ea71df1a51b60af239fa4fc..3478e615b6f24e47b473c5642ea7f2b405ea1b5d 100644 --- a/layers/decoder_1_self_attn_block_attn_w_o.packed_weight.u8.bin +++ b/layers/decoder_1_self_attn_block_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ff3d352a5e8801005b686799c2b163747ac4a997932bbb835a0d495015e8f37d +oid sha256:8130120224c1be33e2655bb591eaadccbb788a00d7394160ecbeb705144a92e6 size 102400 diff --git a/layers/decoder_1_self_attn_block_attn_w_o.scale_values.f32.bin b/layers/decoder_1_self_attn_block_attn_w_o.scale_values.f32.bin index 2428d0935125d084b9dfdac4259ba467a34d529f..5f36d9dc01d115e801adcc31df04c62c0e5da6c0 100644 --- a/layers/decoder_1_self_attn_block_attn_w_o.scale_values.f32.bin +++ b/layers/decoder_1_self_attn_block_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5f5e4618fdc385f02530541d266b2e95d8432cae68eee49ba7284194bae2b6f5 +oid sha256:4c16a2df92ac54a79278c22bc3b52537301a6420a746ce41f227ca99620c8ff9 size 4 diff --git a/layers/decoder_1_self_attn_block_attn_w_q.packed_weight.u8.bin b/layers/decoder_1_self_attn_block_attn_w_q.packed_weight.u8.bin index 5523ef33e8b4e6b991a6559a40b7522c7ffba2eb..f1475adde8b51af692679a5404d79a3730f7d399 100644 --- a/layers/decoder_1_self_attn_block_attn_w_q.packed_weight.u8.bin +++ b/layers/decoder_1_self_attn_block_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e51312cc484dfd598c10b167dbe6af940d013b5aa895d68abab0ab1ddd423d40 +oid sha256:bcaa3d82054320aee69a8fd250931d0f7769850b1b400d9cabbaa255363aa82c size 102400 diff --git a/layers/decoder_1_self_attn_block_attn_w_q.scale_values.f32.bin b/layers/decoder_1_self_attn_block_attn_w_q.scale_values.f32.bin index 2e0c9c902e7aa6217feb19e936339991bb11eb7d..ba64c0f5012b52b85e698b235c2427b719ee91df 100644 --- a/layers/decoder_1_self_attn_block_attn_w_q.scale_values.f32.bin +++ b/layers/decoder_1_self_attn_block_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cee5a232daa2cac8d840a8a5d0710102daa58b71fc593bef0d596bdad06d3423 +oid sha256:ca2201ef58bdbde2cede29914dba3c64d4d39d0ebeff16d113af8159ac009a40 size 4 diff --git a/layers/decoder_1_self_attn_block_attn_w_v.packed_weight.u8.bin b/layers/decoder_1_self_attn_block_attn_w_v.packed_weight.u8.bin index a7746aef329f5e5a7f67e18a3ec37a9e983015da..21b3630998a7ce648f18383bb099d9a9c3604c11 100644 --- a/layers/decoder_1_self_attn_block_attn_w_v.packed_weight.u8.bin +++ b/layers/decoder_1_self_attn_block_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3e474c856099c6bd35589e0f8b44adc02cf84b23065f9ba12ed2cde5cc9b8aa6 +oid sha256:03e84f866c79214ef48ef38da73e63d1be13e26bfab9d4650683bae5cce3a6be size 102400 diff --git a/layers/decoder_1_self_attn_block_attn_w_v.scale_values.f32.bin b/layers/decoder_1_self_attn_block_attn_w_v.scale_values.f32.bin index bc816c85b98795069b210d051abdd5309b025cf8..f2febbbf4a566b98be3e14fb654156273ae6b849 100644 --- a/layers/decoder_1_self_attn_block_attn_w_v.scale_values.f32.bin +++ b/layers/decoder_1_self_attn_block_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bfe670f9f0bc7d426d00b6397e8b6cf6845c80ca0de48bbe3a49a55ef9f36b64 +oid sha256:e3b03dfeea5a4d388630b3b2851b6108a4ca1a1c79c79840fc0c581906782179 size 4 diff --git a/layers/decoder_1_self_attn_block_mlp_w_in.bias.f32.bin b/layers/decoder_1_self_attn_block_mlp_w_in.bias.f32.bin index 09cd32aba0cc79a14018a4f213158df51fcf2e63..137f7e50c056898fddf8c4565849844e670de8c7 100644 --- a/layers/decoder_1_self_attn_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_1_self_attn_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b7bedecafd00ab28da70dd1d41a643953d459aec0d48a0def292a86285947cf3 +oid sha256:aaf15965a9a06378c7f852dd52d89df50e6d385e134adf4af02f7287574f160b size 16384 diff --git a/layers/decoder_1_self_attn_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_1_self_attn_block_mlp_w_in.packed_weight.u8.bin index ed1f961e76710450c7d5d60dc6efc4188c61a1d9..487c7b03269b08d750b03a54c9b8daa2031f8e44 100644 --- a/layers/decoder_1_self_attn_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_1_self_attn_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f9df04837ea94fe26b06971d5ea4373e2c1787e0454f1a07a40be4b7ed491d3e +oid sha256:fa15212d02fd93611265b56ae98073e8df9c39fa11dd951d25dc73ae7c23161e size 655360 diff --git a/layers/decoder_1_self_attn_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_1_self_attn_block_mlp_w_in.scale_values.f32.bin index 7f2d05d4b7c1b3adabd49aab51eaed88c493004f..099a6d71dfba99c239dfb2e11be44b77f263d197 100644 --- a/layers/decoder_1_self_attn_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_1_self_attn_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a76081e216fbbc68d54fed9f36782cb1ec75e3c46c502d65335f13bde902ed9d +oid sha256:25bc94907fcda7ecdceededafb999a692c98ec11cb650db24936e5ef633806ed size 4 diff --git a/layers/decoder_1_self_attn_block_mlp_w_out.bias.f32.bin b/layers/decoder_1_self_attn_block_mlp_w_out.bias.f32.bin index 11535f4c8210456ed9f6d1658b61e49af62cc4ef..3d2ce69acb0b6bb361addd2ae7ad4d4a4cc01151 100644 --- a/layers/decoder_1_self_attn_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_1_self_attn_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c9d76e958c5d851419c40140a50474af301ead3f5a16f22c02d31e37c0ca631f +oid sha256:97a5e1525e46a22cfc60a23ee4f5481ea11f3ca3ac5ea6f8a3ae7bdd90397012 size 2560 diff --git a/layers/decoder_1_self_attn_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_1_self_attn_block_mlp_w_out.packed_weight.u8.bin index 67bb4db6b68d6ca9c01e61a85de689fa9939aa99..b6200446fdc7ea1a5813ea643cafa58b174bedc8 100644 --- a/layers/decoder_1_self_attn_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_1_self_attn_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e05789409db540df482a00110f6eec694cdbbbef2c9793a1413be2828cce36c1 +oid sha256:c17f9cb3942097db7e1cc51d94d570e1c1a1a5fe31649a8d098362d756556f03 size 327680 diff --git a/layers/decoder_1_self_attn_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_1_self_attn_block_mlp_w_out.scale_values.f32.bin index 4d8f9978623ab922e709356f12297e6ea9c0a74b..53d10937f3e6d2068dba3ffb5f3e32f34f880b8c 100644 --- a/layers/decoder_1_self_attn_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_1_self_attn_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6fb8d80b3587c6f014292d592d6208d3bfea3f7b9cfb6fbd95b04abd470a30fb +oid sha256:e771a85f2c8eda7bd2e67b1eb563931e0cf9ae4d9170d42412649041f6bc0ba3 size 4 diff --git a/layers/decoder_2_cross_block_cross_w_k.packed_weight.u8.bin b/layers/decoder_2_cross_block_cross_w_k.packed_weight.u8.bin index 2f6b69cfbbf3df085eed906d6f0528b303e03c89..2556f11c8430afb9222e14b762d695cfd5e47914 100644 --- a/layers/decoder_2_cross_block_cross_w_k.packed_weight.u8.bin +++ b/layers/decoder_2_cross_block_cross_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7163115bc71e1a6087c257f47f457a601f61df0d0a68ae7ddf510c2bd610247f +oid sha256:df6b0c4a3539a35bc6bf6a933fdc949458d51ef7c699f56da3b7d39a7298c735 size 102400 diff --git a/layers/decoder_2_cross_block_cross_w_k.scale_values.f32.bin b/layers/decoder_2_cross_block_cross_w_k.scale_values.f32.bin index 2233a086575effdd2f9fd13dcecbe21593075f01..bd103a893374f4e3b83bce909069f046c827b29a 100644 --- a/layers/decoder_2_cross_block_cross_w_k.scale_values.f32.bin +++ b/layers/decoder_2_cross_block_cross_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:22b15efaa6bed88b4dff49d05a51ffefdd2c7ef81ccc4791b41ea5f4c93e0fbb +oid sha256:fab7acdb1c2d26fec9ed3d0d00cb625d1d47f26530f0526554fbe35d12409b1f size 4 diff --git a/layers/decoder_2_cross_block_cross_w_o.packed_weight.u8.bin b/layers/decoder_2_cross_block_cross_w_o.packed_weight.u8.bin index 056b788ba76553058d6914c91af81aab7d3c8d7f..e90b4aaa1636fadf6077446b384ecbec31c9881e 100644 --- a/layers/decoder_2_cross_block_cross_w_o.packed_weight.u8.bin +++ b/layers/decoder_2_cross_block_cross_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4132a59d48ec7d51ac30c3f4175f57e889599efd7e625c797cbb8b5d831e93a6 +oid sha256:48b06288bc81900b14715d87718e8eeda0c60aad102b2c506db1f60e30426d25 size 102400 diff --git a/layers/decoder_2_cross_block_cross_w_o.scale_values.f32.bin b/layers/decoder_2_cross_block_cross_w_o.scale_values.f32.bin index 40ff67010454778d221522e1881235e29ac88832..fcc748c31e4c2200ef76ac316af7fef275d77ae7 100644 --- a/layers/decoder_2_cross_block_cross_w_o.scale_values.f32.bin +++ b/layers/decoder_2_cross_block_cross_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6a6e109563dbf7d40b494d34532e95a304b0eeaaa2eac805d391b0223af6dc77 +oid sha256:6b8105fa87a0c153c3b85b143ddc7d8345e3f5e7b00609d57ecf05ccb37e75bd size 4 diff --git a/layers/decoder_2_cross_block_cross_w_q.packed_weight.u8.bin b/layers/decoder_2_cross_block_cross_w_q.packed_weight.u8.bin index fcf51cf8c70338f4c5112d4f376f7d6f46c0bc05..2846451f431a0fa09ca79924e6b371858c0abe63 100644 --- a/layers/decoder_2_cross_block_cross_w_q.packed_weight.u8.bin +++ b/layers/decoder_2_cross_block_cross_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e128832a8ecf3aeed808b74d87dad67cd255c2db6a17b162eca7d3127493bf19 +oid sha256:b80420f9122112b055341b9e6744e99760716a5b5ab9a8d2b616a6677fe6e51f size 102400 diff --git a/layers/decoder_2_cross_block_cross_w_q.scale_values.f32.bin b/layers/decoder_2_cross_block_cross_w_q.scale_values.f32.bin index 9bd68f21210bc0252817cd9f1a491a27218a467c..a5c3d39f13746ff4f461cc6feb3830b1f79cb109 100644 --- a/layers/decoder_2_cross_block_cross_w_q.scale_values.f32.bin +++ b/layers/decoder_2_cross_block_cross_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b0e4dcd00804a2f10d5bdd9ef2e26c9827cfa86e628e4a749b1220ff0b323613 +oid sha256:f1cedf6bc25edc3a71af61cce2e793f02054ee85707373183901a6d7bfd9bc02 size 4 diff --git a/layers/decoder_2_cross_block_cross_w_v.packed_weight.u8.bin b/layers/decoder_2_cross_block_cross_w_v.packed_weight.u8.bin index 5337c4321c083e748a8955a16181e50e8b6dd28e..b7eb3dc6d0c167e1bbdfbd9a20a7d87d7d32d468 100644 --- a/layers/decoder_2_cross_block_cross_w_v.packed_weight.u8.bin +++ b/layers/decoder_2_cross_block_cross_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:523d4f77f2c9a7c743935466c972cc168287e14dece99d40238b346fb27f97fb +oid sha256:1a2cbf704f1f495d86f0dcee2ff15a889756988f9ae0ac8b74545dd27c9def2b size 102400 diff --git a/layers/decoder_2_cross_block_cross_w_v.scale_values.f32.bin b/layers/decoder_2_cross_block_cross_w_v.scale_values.f32.bin index 669c6d6622236780ba875716efbc97d2fe8eff68..dfb83608157d1c0f6c6f96af08b45112ad518918 100644 --- a/layers/decoder_2_cross_block_cross_w_v.scale_values.f32.bin +++ b/layers/decoder_2_cross_block_cross_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9b9fc9730e2c668496ece1d4a5de9763bc44f2671b241a1c1debbb5ced26bcc5 +oid sha256:df1ad53be309ab52d1870c805583bc8f1f5747febc64464a8ce2d871b91c11a9 size 4 diff --git a/layers/decoder_2_cross_block_mlp_w_in.bias.f32.bin b/layers/decoder_2_cross_block_mlp_w_in.bias.f32.bin index e057375698ce15d6caa4610ddf64ef164b3bf90e..0376a3340947ccde09823b69320acd54a3053343 100644 --- a/layers/decoder_2_cross_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_2_cross_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fa1ba39d161738e5813daf52c5771c4b342fbb0cff72e6f002a4ee2ced15f2a5 +oid sha256:62ee98df5599d0fef4c7e56e802677f5db362fe0f3fb1940c7b073a24ef84a15 size 16384 diff --git a/layers/decoder_2_cross_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_2_cross_block_mlp_w_in.packed_weight.u8.bin index 25cd68881be485b35549b9409a87fe1bba6493b5..0e78b466d84b9a5e53bf81c970841c57282f3759 100644 --- a/layers/decoder_2_cross_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_2_cross_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:84689b32bc8ca799f9dbec89a8007bf21afbbe8112aea203cb54ef49cd0fd741 +oid sha256:6791d3fd41589fab3eda4e56c8537e654686e8a90dbec04bc4f5dca84b23220d size 655360 diff --git a/layers/decoder_2_cross_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_2_cross_block_mlp_w_in.scale_values.f32.bin index a942bfeb27fc1f9a9b34e99ac2d7135ace9f5ce5..e2faa1e115882c3983c0a70d66c83dc687e612f7 100644 --- a/layers/decoder_2_cross_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_2_cross_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d2f1117c13f4e19bfe03e087a9701a252e538ae56a8b1ee89e39086101359b27 +oid sha256:d3e6af24929fb6449c2a8510f5ce57d515629a5fa3996f6fc96993a698a8a337 size 4 diff --git a/layers/decoder_2_cross_block_mlp_w_out.bias.f32.bin b/layers/decoder_2_cross_block_mlp_w_out.bias.f32.bin index 61ae0c22c9f4ba581f16a750610a6fce4d7751fb..f525389a091285b05fb5132593c014851b76c843 100644 --- a/layers/decoder_2_cross_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_2_cross_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a1c186530cec1e3ef538bf7a766cbc32991dddf87af3906987f90cfb231bb7d3 +oid sha256:a98d0431811d1f5bf2c1ebf562d91f3ce65d75d64520575efcfcab46e018b2e4 size 2560 diff --git a/layers/decoder_2_cross_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_2_cross_block_mlp_w_out.packed_weight.u8.bin index 7b2085832e50d1019fa8d2738965318bdc4b36cf..7597b5d995d3f399dd0a12de88d4875ec14cf17e 100644 --- a/layers/decoder_2_cross_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_2_cross_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:243056cfc23ab07879aed6d68e44c4a03bce85cd1d33916cbddd05d3ad558647 +oid sha256:71cab0c976abb9f5a8f17da4cf8460f356e31729d1e0593a2e5aa88e41a458f6 size 327680 diff --git a/layers/decoder_2_cross_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_2_cross_block_mlp_w_out.scale_values.f32.bin index 69cef313e6f78a0c03ec75ebaef29e4d8e161f5c..38ad3d04f49da51935be81c044cde23b04046478 100644 --- a/layers/decoder_2_cross_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_2_cross_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:23fa500a5c1d7fe55f6d2e59c571d48b88c9dec6c1efe09f3f3f4cffc4d0adbb +oid sha256:2795d779ab9f77b8fdf7d144a1d92a34d68a4af9dbdd2f7594fdcfecde3abadf size 4 diff --git a/layers/decoder_2_self_attn_block_attn_w_k.packed_weight.u8.bin b/layers/decoder_2_self_attn_block_attn_w_k.packed_weight.u8.bin index a250e47f8a684992ae0f7bb6b7f350c2392644ab..fad17a412fb28ebcce76824ed54d0317631b0ff6 100644 --- a/layers/decoder_2_self_attn_block_attn_w_k.packed_weight.u8.bin +++ b/layers/decoder_2_self_attn_block_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:12099b3ddd6bdaa49ad496020dc79416d2cb6e18f19704bb554190d434ab7155 +oid sha256:71837c8df53923a1eb51839206bc2964dbb5931829c8bcaeda9baf89b1fd222f size 102400 diff --git a/layers/decoder_2_self_attn_block_attn_w_k.scale_values.f32.bin b/layers/decoder_2_self_attn_block_attn_w_k.scale_values.f32.bin index a8fcd54b346171d5e6f489d37daacd9ba7618d08..26611118a039c59ecd5b4977cebc723cbf0929b2 100644 --- a/layers/decoder_2_self_attn_block_attn_w_k.scale_values.f32.bin +++ b/layers/decoder_2_self_attn_block_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:18cb18c1ca9df4ce1418ee60984e026d87470bff9d8f4f76327a33de17ed4361 +oid sha256:c0ee0049491ee814569ee869d71112df87a78155b57e8128d03d2bdacf4025ea size 4 diff --git a/layers/decoder_2_self_attn_block_attn_w_o.packed_weight.u8.bin b/layers/decoder_2_self_attn_block_attn_w_o.packed_weight.u8.bin index 23fc32d375e5a229e11f16983bf2dbac39aaf685..df9d5b4bd178a5b4ca505fc00b27db39610a9076 100644 --- a/layers/decoder_2_self_attn_block_attn_w_o.packed_weight.u8.bin +++ b/layers/decoder_2_self_attn_block_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0db7a1ab2c75031956cb3abe22317c64ef8e11fe66ceac512bddcb13d8d23380 +oid sha256:16b3aaee9a4357d85e3911304dba4b92f256eb99648014896c74b67f15a881d4 size 102400 diff --git a/layers/decoder_2_self_attn_block_attn_w_o.scale_values.f32.bin b/layers/decoder_2_self_attn_block_attn_w_o.scale_values.f32.bin index 00cff92d79e3dfd373e5d22869c1a1946b0338b6..a6ee7c093a1ad963750235f9a021e4e2c6f5ae8b 100644 --- a/layers/decoder_2_self_attn_block_attn_w_o.scale_values.f32.bin +++ b/layers/decoder_2_self_attn_block_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ff4979e14dfd682175f59a47aabac427a7975f5a4fc223fa72b96cea3c229f8d +oid sha256:60debbe37b6fade7faf5609fbb09417ac8d679f41834db5f00e7c07f39005e8e size 4 diff --git a/layers/decoder_2_self_attn_block_attn_w_q.packed_weight.u8.bin b/layers/decoder_2_self_attn_block_attn_w_q.packed_weight.u8.bin index 5a3862b07210148d61d13b2afdc9f856e1f2213c..19e076c5528740ed9d3d1a52eca7e8d87ae6f03d 100644 --- a/layers/decoder_2_self_attn_block_attn_w_q.packed_weight.u8.bin +++ b/layers/decoder_2_self_attn_block_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fc2b4a3dda7010193c94d86591e64dc466d629981abb4e008ad60822c1b0c5eb +oid sha256:a46c45fa4b4aa8fa996feae44e7be7d8820867af2449e0104f53fa6775179fb1 size 102400 diff --git a/layers/decoder_2_self_attn_block_attn_w_q.scale_values.f32.bin b/layers/decoder_2_self_attn_block_attn_w_q.scale_values.f32.bin index 81e4e814ec6b703ea86276a56f856b3e9c8ab9c5..0d93d6c9382b51ea87c2cde69efa2c8a215d3cc7 100644 --- a/layers/decoder_2_self_attn_block_attn_w_q.scale_values.f32.bin +++ b/layers/decoder_2_self_attn_block_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:594e276d9d79525ee1e48c2a8fdcd54499ef35e7722735cb1f996b273ca43e18 +oid sha256:08ad6327be95f2e8252c0521cc183e9262c5ca80beaa6d34484189cd74f5301d size 4 diff --git a/layers/decoder_2_self_attn_block_attn_w_v.packed_weight.u8.bin b/layers/decoder_2_self_attn_block_attn_w_v.packed_weight.u8.bin index 441dbb1c73ce02f7435f298bae5171bc2a397fea..6132fd92491a38a7d995e8144908cfabba384ef6 100644 --- a/layers/decoder_2_self_attn_block_attn_w_v.packed_weight.u8.bin +++ b/layers/decoder_2_self_attn_block_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ac7a8ee517ee14bd8fea44595f29da3148dc5d16b75cd861672c763e16ef453e +oid sha256:9418c8f820fe57f66a6d297cf58d1d7145ee125e5fed29cad668c4013b55b5c2 size 102400 diff --git a/layers/decoder_2_self_attn_block_attn_w_v.scale_values.f32.bin b/layers/decoder_2_self_attn_block_attn_w_v.scale_values.f32.bin index 74990aa94141a258e15c3cd1ea71c22890473d0d..757bf725ab9308cf465da99a5806de780d1826d6 100644 --- a/layers/decoder_2_self_attn_block_attn_w_v.scale_values.f32.bin +++ b/layers/decoder_2_self_attn_block_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d5694a3a00c63856aa4ebaa5123cfa03ea6aa2f9e43b376846a07a55bddf367f +oid sha256:c006a324dff21858853c4e4aea09fee0a0ce2f52a39ad72e78e7390a5245970c size 4 diff --git a/layers/decoder_2_self_attn_block_mlp_w_in.bias.f32.bin b/layers/decoder_2_self_attn_block_mlp_w_in.bias.f32.bin index 6c528773933559e1876ec2c09d3f5f492871174b..ee48a34d5180cc380125b5186a2b729a9ba082fa 100644 --- a/layers/decoder_2_self_attn_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_2_self_attn_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a05fd796bfabbcd856a02eecbdf1c61615fc0bae9bb77141dd55c871d87b4fde +oid sha256:a9f6b4f1fe22589729eb0d737601b23ba4cc9ebfeadd09523d1ae79d52f3907f size 16384 diff --git a/layers/decoder_2_self_attn_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_2_self_attn_block_mlp_w_in.packed_weight.u8.bin index ffd462042f66224d1fc5c7b762a94d75c6715644..ff123fa8d6c97ff6e46ffc9128a2e772f1058cdd 100644 --- a/layers/decoder_2_self_attn_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_2_self_attn_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:254e4df1cacb8057dd692874312ddae05e490c57b26ad1b9ed7e5b402bb7c104 +oid sha256:3aa11246c81fd0bcac67c5f26df2ce838eaa6770c6e8b188a2b1efdeb7e9407f size 655360 diff --git a/layers/decoder_2_self_attn_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_2_self_attn_block_mlp_w_in.scale_values.f32.bin index fdc1eaee2f5330dd7cfc21c43fa8b87be3ac6926..862e64f33cc5e21d105013133132ea1510d79462 100644 --- a/layers/decoder_2_self_attn_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_2_self_attn_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d140fa74601073ef9acb4600f6f1bfb6110f72c6d7e082beb6820f0252555a3e +oid sha256:3281853fb7157f4e1e939dccb4fb652dde048d34458a09602421121869212659 size 4 diff --git a/layers/decoder_2_self_attn_block_mlp_w_out.bias.f32.bin b/layers/decoder_2_self_attn_block_mlp_w_out.bias.f32.bin index 4a135d6d83158b7373e18b0cb03abd5f49bf0a28..76f4a48f50fbf91b039ce3e3987cec867565eda6 100644 --- a/layers/decoder_2_self_attn_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_2_self_attn_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c13837272232ed41d7e260f3b31b5626618b8c3d9acc6ad54b63809998ead325 +oid sha256:57e85c9d9fa797c785031a5297b55baa622fe733fc2cad745c4def4220e6de49 size 2560 diff --git a/layers/decoder_2_self_attn_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_2_self_attn_block_mlp_w_out.packed_weight.u8.bin index 13a58f1d92c73f5e5d906a6370fe1be206d7bf88..4ca07d23bf82aac81690c231bac994ae85dd19f9 100644 --- a/layers/decoder_2_self_attn_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_2_self_attn_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:72ebd4c2d0042090da61dfe3a7ac97a48f195e2ca73e15a689d0457aa10c4f9e +oid sha256:08c636f9bcfbb566fc98cf944f6410f7d07308c6885130104ba21b645b54229c size 327680 diff --git a/layers/decoder_2_self_attn_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_2_self_attn_block_mlp_w_out.scale_values.f32.bin index 084ea45299387d250d0f8ba6f65ef49404f8a1b2..1567165004e4990cea5b9cadb8ba341c1fd6c20c 100644 --- a/layers/decoder_2_self_attn_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_2_self_attn_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fbf47255266bc2a81a08229c4b3ccfa1469ad237636bb161483e3b2d7fb86be9 +oid sha256:93c67e503abfa2b964d6fd04f0da9d415189c99c05d16fd58a003a8819559cff size 4 diff --git a/layers/decoder_3_cross_block_cross_w_k.packed_weight.u8.bin b/layers/decoder_3_cross_block_cross_w_k.packed_weight.u8.bin index 5aa7d188f2cd5566b198e9c1756c46020a107a24..a88a1d5036525b916a88e9111cc385c00d547b22 100644 --- a/layers/decoder_3_cross_block_cross_w_k.packed_weight.u8.bin +++ b/layers/decoder_3_cross_block_cross_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:477aaa3e3dd636d2a857add391fc8a3a2f4fd26fcbf30b3cf95438cbd590737e +oid sha256:0935f374bd55ada307174506bc24bd4291f5c72db145af937ecd472267d646ba size 102400 diff --git a/layers/decoder_3_cross_block_cross_w_k.scale_values.f32.bin b/layers/decoder_3_cross_block_cross_w_k.scale_values.f32.bin index f79b7fe6edbd26a1d9f3c6554415e37b27710574..6002c9b50481700d4e508b2f80810d17a2b8b640 100644 --- a/layers/decoder_3_cross_block_cross_w_k.scale_values.f32.bin +++ b/layers/decoder_3_cross_block_cross_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:92e371e8f1578aff6796f3ac4975c287e5d63174323035efffc1c931fce54f2c +oid sha256:87b6ef8c6d77f5a498047d9a58ee6fc5e3296b67a4909aff8735fbb783a18b0b size 4 diff --git a/layers/decoder_3_cross_block_cross_w_o.packed_weight.u8.bin b/layers/decoder_3_cross_block_cross_w_o.packed_weight.u8.bin index 8e5edbda29b165f4267038256ee9177f94d2636c..69f0997888c16b70047d925d671bf59098dbd4eb 100644 --- a/layers/decoder_3_cross_block_cross_w_o.packed_weight.u8.bin +++ b/layers/decoder_3_cross_block_cross_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:10dfd78a5e363fb05309f0fa3ca5a8fa688683439e799e2bf5190fad839f07d8 +oid sha256:e6adc5855efc0bb782aed30cbe0c6a1b2f8c80608739c6c88fdc871a8499737d size 102400 diff --git a/layers/decoder_3_cross_block_cross_w_o.scale_values.f32.bin b/layers/decoder_3_cross_block_cross_w_o.scale_values.f32.bin index 943433483f48ea7b2d8113d4a08f0013d7208954..f08d12f1dec7ccabb8222b6503c73fff5aad66ff 100644 --- a/layers/decoder_3_cross_block_cross_w_o.scale_values.f32.bin +++ b/layers/decoder_3_cross_block_cross_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6d5cc8f071d2dc9ffe100d11d0b9f805a71ec3f0e1dbe74a4e28ff79176faca0 +oid sha256:ff846e9985573ecd305b77a54a7e988d2144dc5adf9a6916813d435e9ab561cb size 4 diff --git a/layers/decoder_3_cross_block_cross_w_q.packed_weight.u8.bin b/layers/decoder_3_cross_block_cross_w_q.packed_weight.u8.bin index 182b0bc46126b77770276cfce86fa6f238b32de0..a356888a529c9d67e1b311a8e9eb0fe8ecebdd6f 100644 --- a/layers/decoder_3_cross_block_cross_w_q.packed_weight.u8.bin +++ b/layers/decoder_3_cross_block_cross_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8f97698724d741ad7f51f5dba3d951f331ad800efc11f922b102865baffabdd1 +oid sha256:11cbf72fee9113e4c199fabd74ed6b5292b90eaee86b44c1adccae8ccd942783 size 102400 diff --git a/layers/decoder_3_cross_block_cross_w_q.scale_values.f32.bin b/layers/decoder_3_cross_block_cross_w_q.scale_values.f32.bin index 8c653e4b58d7d5e3c1285d50c46784674fa47f7b..c32011440c3cfe53f5d919f472eb334525bd9599 100644 --- a/layers/decoder_3_cross_block_cross_w_q.scale_values.f32.bin +++ b/layers/decoder_3_cross_block_cross_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a2632ea079b5113f382e81cf1782633e02e9b4ed1146c56b171d669602897ad3 +oid sha256:6e0380b2fb97251dc52cde6bad28c297473604cc977a027621c9baf7240444c0 size 4 diff --git a/layers/decoder_3_cross_block_cross_w_v.packed_weight.u8.bin b/layers/decoder_3_cross_block_cross_w_v.packed_weight.u8.bin index ca13dcaabd074a05768ff1b0226a5f6e85e25636..bcb42bd8d1732dc2966e13eaf2b1c8a6aafdf394 100644 --- a/layers/decoder_3_cross_block_cross_w_v.packed_weight.u8.bin +++ b/layers/decoder_3_cross_block_cross_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0acd96871682cabaeda0c52a369e3320c4fa2267f2447df644f5ddfa00807a9a +oid sha256:1a2937c81a609059d506dc0346018eaee4ea694d4ec4a28ea2f216cbf9fce034 size 102400 diff --git a/layers/decoder_3_cross_block_cross_w_v.scale_values.f32.bin b/layers/decoder_3_cross_block_cross_w_v.scale_values.f32.bin index 231a32ad2d32766611930edbcd6fe17148c8aa71..e87119edb4b65c612a8cfce65b6d7451d94f2aa5 100644 --- a/layers/decoder_3_cross_block_cross_w_v.scale_values.f32.bin +++ b/layers/decoder_3_cross_block_cross_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a2e18e9c82d54908c20217100cc44da0690dc7d126e8ccaff3d55221cceea5e1 +oid sha256:0faeb054329b75c4b46fff740fb9bff988744aaf029feb19b27698d926185604 size 4 diff --git a/layers/decoder_3_cross_block_mlp_w_in.bias.f32.bin b/layers/decoder_3_cross_block_mlp_w_in.bias.f32.bin index b812577df90213769db1f425fed509e999dde93a..c47bc4e1c74e829374696dd3c9afa28bc5987d21 100644 --- a/layers/decoder_3_cross_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_3_cross_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b55b6b210e332ecf839d8e181f76fd76be84b835972c103009c2b8f42b105017 +oid sha256:e849a329a8fad72a3c78519452879346d4610159c55ba54cfcb9b781f97cb30e size 16384 diff --git a/layers/decoder_3_cross_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_3_cross_block_mlp_w_in.packed_weight.u8.bin index bb3dd541e7a395847179bf5a76a8edc5fcf1ea4f..64b00ec41a5a7e8fa3f0c7acf8795ab50383d4ce 100644 --- a/layers/decoder_3_cross_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_3_cross_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:61423b913e96c820c10dc2a26cd5c4de3e998b1b04dcf2fd4a41aed1e738cf7f +oid sha256:b42b255a137c29ef6f63d5c24a0fc97de401b6f9b34d30df779ba7118912e2e0 size 655360 diff --git a/layers/decoder_3_cross_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_3_cross_block_mlp_w_in.scale_values.f32.bin index 6c42edee77ca9e4c2ccf8a6427460d3729e17519..7073a920c593852e8090850b7e20cef3795a7c90 100644 --- a/layers/decoder_3_cross_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_3_cross_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:08f0a86a075e56691e5f5e3bd404c005147007c9b6b0571b8bc8c07737aa3d67 +oid sha256:c7b72990e8b2ec40c9892aba65b9cac0622cbc6ac1ad1963be6f12c45530c560 size 4 diff --git a/layers/decoder_3_cross_block_mlp_w_out.bias.f32.bin b/layers/decoder_3_cross_block_mlp_w_out.bias.f32.bin index af2340fbfac7e69586eabd6e05ac0e7c8ecae794..ebd098b0a8423150447a58ecd4db09064c1efd09 100644 --- a/layers/decoder_3_cross_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_3_cross_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9f1b6d2c15741c6eab8cfacdac19bc54f431fd2432c2f39afa48b6058f1f343e +oid sha256:2c675afd5742963783bf330d279082e56a8b5538a9939e168179c89fee8da7fa size 2560 diff --git a/layers/decoder_3_cross_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_3_cross_block_mlp_w_out.packed_weight.u8.bin index 79bcd7e96d7399c04c6a27b2b44ed3c38d9cd56c..68e65e216f66ac6773adb03bc7237ff566affdca 100644 --- a/layers/decoder_3_cross_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_3_cross_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b695846f6c7cd7fffbb50080475d1b2f18cf5312be049cc47802b9bbb23aa497 +oid sha256:ef232657569eff68765131f1f78eeabb02eb1775709955e07c99ba4440570bd3 size 327680 diff --git a/layers/decoder_3_cross_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_3_cross_block_mlp_w_out.scale_values.f32.bin index 4de4064ac35baa934a391fe27e137a43335bbb4d..43afe180256d99dc2f8385eb33b56ac056fa2bd1 100644 --- a/layers/decoder_3_cross_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_3_cross_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:91fc9753ecb2e9d8f4e37de4aff3cf86d17969af54f6200871685ec677ed1ba2 +oid sha256:00ff62715519571ab08949ecbbb673535a3671d32b1a9eed572e5bbe7aad8b7d size 4 diff --git a/layers/decoder_3_self_attn_block_attn_w_k.packed_weight.u8.bin b/layers/decoder_3_self_attn_block_attn_w_k.packed_weight.u8.bin index 1bcb13af9575a15c0bd3937c4b9f5c4d7e433e5a..7ab1efbb875052c3646c971a2d5b512f3be796bd 100644 --- a/layers/decoder_3_self_attn_block_attn_w_k.packed_weight.u8.bin +++ b/layers/decoder_3_self_attn_block_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:af216fdafa01c70a3c29f06a2cd89ca7548588df5005f64d722a063e9df46dfe +oid sha256:d8566006b654e57a85cf7e668d23eb6a8b00bbea8c920c5e3004bac61d165902 size 102400 diff --git a/layers/decoder_3_self_attn_block_attn_w_k.scale_values.f32.bin b/layers/decoder_3_self_attn_block_attn_w_k.scale_values.f32.bin index 7264da2701eebbb4c63687342f473c0389d6325d..aae5187f3eb03081bcfd62812eb0fd093907b83a 100644 --- a/layers/decoder_3_self_attn_block_attn_w_k.scale_values.f32.bin +++ b/layers/decoder_3_self_attn_block_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:040b7bfe0dda2f2e3885d8ac903ede97b7c5c54ff3a60faa0e7b2f8ea1b24eae +oid sha256:92d66a55428f7813a0c25bf7ea743cd5fefba17398bd3cded05ceeb46fc4e665 size 4 diff --git a/layers/decoder_3_self_attn_block_attn_w_o.packed_weight.u8.bin b/layers/decoder_3_self_attn_block_attn_w_o.packed_weight.u8.bin index 064eb3e462e4fc7da8a05378db9648e564cd9109..9aae190b1703efed3347f0c39abe00ad09efc186 100644 --- a/layers/decoder_3_self_attn_block_attn_w_o.packed_weight.u8.bin +++ b/layers/decoder_3_self_attn_block_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:00e16ff3ecda8c9f89eeeee4f1271e9f7b7807571970e15c2070acd6c7a36190 +oid sha256:56465616cc74db684e4cf91b6a4eaedf20d2dc0fce3d52e80188ad2ff4b17bde size 102400 diff --git a/layers/decoder_3_self_attn_block_attn_w_o.scale_values.f32.bin b/layers/decoder_3_self_attn_block_attn_w_o.scale_values.f32.bin index d05411381cd96175f8cc552ca10fb6987a395b68..05b6d40d1725745e6f0b11ea0047ff034415606c 100644 --- a/layers/decoder_3_self_attn_block_attn_w_o.scale_values.f32.bin +++ b/layers/decoder_3_self_attn_block_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:03a834edef6a098c2fca9315a4167ca1be9634782657a9909fa48bf313711a04 +oid sha256:64be926fb8e3f7186096dfc7d71be5ef1c3adc4b3ca4cac933399f06ca4128ef size 4 diff --git a/layers/decoder_3_self_attn_block_attn_w_q.packed_weight.u8.bin b/layers/decoder_3_self_attn_block_attn_w_q.packed_weight.u8.bin index 9fc2918218301e3546a116ec688e98a105e8f16d..4dbcd6094e0083df06f007a0f932e4458882b5d4 100644 --- a/layers/decoder_3_self_attn_block_attn_w_q.packed_weight.u8.bin +++ b/layers/decoder_3_self_attn_block_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:46638b7393c85823b8c15351aa8b337ad6b0ef45d4580ed4d6ed039a056e87db +oid sha256:5a8b72acd19e793b8c0299c75b992f12f268403a9cd011d6514aff9d3232dc1a size 102400 diff --git a/layers/decoder_3_self_attn_block_attn_w_q.scale_values.f32.bin b/layers/decoder_3_self_attn_block_attn_w_q.scale_values.f32.bin index 5f47bec07f36bcce85bcbfea50e81ad8f0ab9554..42f5bd3161f753172ea5515f8fbe5e6ffc55e3a3 100644 --- a/layers/decoder_3_self_attn_block_attn_w_q.scale_values.f32.bin +++ b/layers/decoder_3_self_attn_block_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:200b76613bfdbe2a0254ef01611444ec15f9de52fb50f81dab3d273b4b96da62 +oid sha256:f0b2ad4c13d7c55058e593fe97242797f9c3bf699d4b4382a1bf45cab3145f3e size 4 diff --git a/layers/decoder_3_self_attn_block_attn_w_v.packed_weight.u8.bin b/layers/decoder_3_self_attn_block_attn_w_v.packed_weight.u8.bin index a840f1dac8a68086293c3472e4aed25f1af2fb18..09bce7b4729b4762121803045f85b6d93507ffa3 100644 --- a/layers/decoder_3_self_attn_block_attn_w_v.packed_weight.u8.bin +++ b/layers/decoder_3_self_attn_block_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:74a9caf4caf5cf52645f81f8b0fc823e42084f822da768e2614e6066fb892581 +oid sha256:db853386ca2135aeb2a21e4811a96f6a7f5e38ecc356057cd61826dc281c9a1f size 102400 diff --git a/layers/decoder_3_self_attn_block_attn_w_v.scale_values.f32.bin b/layers/decoder_3_self_attn_block_attn_w_v.scale_values.f32.bin index 171a218d39f9cb4b052a4a5067a07693f3da5a65..b544245ed025a054e8f67c40fc3b0aad2a17099c 100644 --- a/layers/decoder_3_self_attn_block_attn_w_v.scale_values.f32.bin +++ b/layers/decoder_3_self_attn_block_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6bdc606c42114297c497963ca58b5bb3be4ec11ab89424a9a1d19ecd9fbb84a0 +oid sha256:01159e95ff778abe2236d0492dfca3d20d14a6b3848f0583586174cbda64aaee size 4 diff --git a/layers/decoder_3_self_attn_block_mlp_w_in.bias.f32.bin b/layers/decoder_3_self_attn_block_mlp_w_in.bias.f32.bin index f351c2a0e16e24c44f4756bc2ca4bf96e58abe89..9b7c798ace3469e651c12ebcfad4cddab9fb5bf8 100644 --- a/layers/decoder_3_self_attn_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_3_self_attn_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:760c1ece295a8913e80f14927e266520a947959aedcfb2c38b58af2f920b2f5e +oid sha256:8698835f3c913ac1a26c481cbb8bfd690bdfce971922e3d7d541a6d7099e3977 size 16384 diff --git a/layers/decoder_3_self_attn_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_3_self_attn_block_mlp_w_in.packed_weight.u8.bin index e85dbf64fa9bd4121809655d20f7fdc765a31836..15514be166060affb200cd736a67255795956e65 100644 --- a/layers/decoder_3_self_attn_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_3_self_attn_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4d52aa7e8602cf434845d833c7814f3d81462b12497e429b61418c0b81b39959 +oid sha256:375345d99dc960f212fcc7ab73fe74e618167f4bacb0e34b3d5fd75682efa4a9 size 655360 diff --git a/layers/decoder_3_self_attn_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_3_self_attn_block_mlp_w_in.scale_values.f32.bin index 0b3edf6a31722ce036768f7deae50347c6c926ae..0fb828b34a7702e0d066bb017e7a6b15f0ab536c 100644 --- a/layers/decoder_3_self_attn_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_3_self_attn_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f7a83807f3dc29cf15f6cc3e6dd2c883491029cd88085c34661ae464a2d7c2b4 +oid sha256:a93671fb72d1708202ce8296acc051d8cb6e1161c733425448bf66fea20c1115 size 4 diff --git a/layers/decoder_3_self_attn_block_mlp_w_out.bias.f32.bin b/layers/decoder_3_self_attn_block_mlp_w_out.bias.f32.bin index 02da5817149b39b4f3ec4754ac31e414b5ec1ed1..d35a3cb935a5be24f8d3ac01f1dcf6671ce901a8 100644 --- a/layers/decoder_3_self_attn_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_3_self_attn_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:43f6f98654b26b0732dcf104df7c540836aad931c7878b05640d7fba87a90d9d +oid sha256:815889ff5b4eb207d60345cf0edaa41e14ef55598c0c6f30289543589cad84fc size 2560 diff --git a/layers/decoder_3_self_attn_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_3_self_attn_block_mlp_w_out.packed_weight.u8.bin index e2dc28c44f2f74c3d5906e212765c803dd9a332d..d28bb4423ed9e5dc1335d89375f8c511ea470657 100644 --- a/layers/decoder_3_self_attn_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_3_self_attn_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:607fbcf1a60bcbf4076552c0c51cff2853cf36d2f2b7a6fb02f8624033486b76 +oid sha256:2424b38121121a0387b71c91d153ba9debb8aa9fb2737ed1221c2606888475b6 size 327680 diff --git a/layers/decoder_3_self_attn_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_3_self_attn_block_mlp_w_out.scale_values.f32.bin index 57f767a57abf9ba43bda72a1b7f8aac7f4954bb1..ed72cc561787141dd2d7def749c3c49313fdd6f6 100644 --- a/layers/decoder_3_self_attn_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_3_self_attn_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b86ac13eba188e7744a8064948b792bbcbe74baeeb602cc6d1cdef84bad3b00e +oid sha256:a104324e1e7cc41a3f01509e6e8ced8e762acef0fabac4544ffb92b443d73019 size 4 diff --git a/layers/decoder_4_cross_block_cross_w_k.packed_weight.u8.bin b/layers/decoder_4_cross_block_cross_w_k.packed_weight.u8.bin index ae7357131651cb88c9552fa91116f80fd3e151ad..2f533183a6f1e0590a24cb7a885f8765f98e0faa 100644 --- a/layers/decoder_4_cross_block_cross_w_k.packed_weight.u8.bin +++ b/layers/decoder_4_cross_block_cross_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c42933ccb66f22357bb4e6d65e94956b9d818f192296b939f38847111fc520f0 +oid sha256:0ce39dd91774074736c5720d2ef64ecab695ad08f57343d5e2c97b11448dcf18 size 102400 diff --git a/layers/decoder_4_cross_block_cross_w_k.scale_values.f32.bin b/layers/decoder_4_cross_block_cross_w_k.scale_values.f32.bin index d3270bef111ecde71284f5763365c3d5006af307..d40caa96d40a07f6cceef86d3dcb15c786f26c2f 100644 --- a/layers/decoder_4_cross_block_cross_w_k.scale_values.f32.bin +++ b/layers/decoder_4_cross_block_cross_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a0bc89dcf0a96b2ae6f6f5c25823f4bff2d2a01eebf4532f8aa65c79c4643bec +oid sha256:a1f0f48bb45d012edba1ff192711ef50e47cf6a92a0385bc9e319e3f2478476c size 4 diff --git a/layers/decoder_4_cross_block_cross_w_o.packed_weight.u8.bin b/layers/decoder_4_cross_block_cross_w_o.packed_weight.u8.bin index a49504998b099c04099dbde0c9eea125d6e173d4..1a103029f52bb9869b961c75ac40dce2f2464c58 100644 --- a/layers/decoder_4_cross_block_cross_w_o.packed_weight.u8.bin +++ b/layers/decoder_4_cross_block_cross_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:018bbaadc1966a49cc913b807f3a54465c8a0a2a1f566e91a57c172a0624bb2d +oid sha256:37f9d08deeb5da3fd5917e830b09280c2ef8698f513cb4fbd48d441278b63d4f size 102400 diff --git a/layers/decoder_4_cross_block_cross_w_o.scale_values.f32.bin b/layers/decoder_4_cross_block_cross_w_o.scale_values.f32.bin index 5fd69b0d548592879fc9752cf6ab4328879dbcad..949c929c77e2ee8b4dddd4e16dfe78b32d1adf52 100644 --- a/layers/decoder_4_cross_block_cross_w_o.scale_values.f32.bin +++ b/layers/decoder_4_cross_block_cross_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8a67d2ef56ce256ac2ecfabc2f78e2c28089507c9715d21fce13153ea0a93cf8 +oid sha256:6d056c23594e9fda03e1f0045e7bb77bd977c7ad97ce3facd6079d7e21539692 size 4 diff --git a/layers/decoder_4_cross_block_cross_w_q.packed_weight.u8.bin b/layers/decoder_4_cross_block_cross_w_q.packed_weight.u8.bin index 88d38aa7dfc2db42153961e4625419859a3af4c1..45f79db3c5552da3d3b85f6455cca29b9f44ec11 100644 --- a/layers/decoder_4_cross_block_cross_w_q.packed_weight.u8.bin +++ b/layers/decoder_4_cross_block_cross_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bfd163ff0dcad21ccd7fefa73fbf79ac9053c709a5717e10f75b6fb936dc8c6c +oid sha256:f89dfef1e375b5f6cddb72810c8f43663550c1f6617a0689ebfb9ac9d71d6ce2 size 102400 diff --git a/layers/decoder_4_cross_block_cross_w_q.scale_values.f32.bin b/layers/decoder_4_cross_block_cross_w_q.scale_values.f32.bin index 672b61dc7b0641ce9a97bae392e496524bc1039e..895819d59a2706bbd8f55247a9eded3cc3f86cda 100644 --- a/layers/decoder_4_cross_block_cross_w_q.scale_values.f32.bin +++ b/layers/decoder_4_cross_block_cross_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7f4810a434b0a8dabbb5eae5b0fd327442680722039f8645b6bc00ffe3654ce1 +oid sha256:86b0c2ce4ea6968b0d5bfe161ff5172eccd9b6ebc1a81202bd03f0d21394be60 size 4 diff --git a/layers/decoder_4_cross_block_cross_w_v.packed_weight.u8.bin b/layers/decoder_4_cross_block_cross_w_v.packed_weight.u8.bin index 58f612aeaef258c6f00b85aee3be3696a2aea0d8..5ad4d6efb274757945ee5d73becf3e3d622b0646 100644 --- a/layers/decoder_4_cross_block_cross_w_v.packed_weight.u8.bin +++ b/layers/decoder_4_cross_block_cross_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:566aef9b1805aaa57df77ebf90224e82bd2ff3d6a815249d03e5e11c5ed1c23d +oid sha256:1a625004d390f89ba744f0e76c635ef5ed804ebe321d4468558a81037c02f97e size 102400 diff --git a/layers/decoder_4_cross_block_cross_w_v.scale_values.f32.bin b/layers/decoder_4_cross_block_cross_w_v.scale_values.f32.bin index 22e074442425475a06460baf54f96bdb0a332131..7c269d23439729fde3d151acd3eff26e1f940d58 100644 --- a/layers/decoder_4_cross_block_cross_w_v.scale_values.f32.bin +++ b/layers/decoder_4_cross_block_cross_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9536ed49e49bbd570119049a0116e4d11b8198a1ba378c107175ee7333d72ac9 +oid sha256:9df9184076a41b00dcac5ab27177869f612ff7b7f6f9fa2e86940b111132a375 size 4 diff --git a/layers/decoder_4_cross_block_mlp_w_in.bias.f32.bin b/layers/decoder_4_cross_block_mlp_w_in.bias.f32.bin index e295240708de4757fa8ad07e539eb0de7eebed1c..d8e98f88a48785ce1da953a867e9688093260a7c 100644 --- a/layers/decoder_4_cross_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_4_cross_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:504553e77c868b26f1e9a3df5d802722876c10ed42a3022eba8fd37483108c12 +oid sha256:d15970cd583a238ef5df0cba7c57f0f0ccea9051feef6c83b10eee60a2ad92b1 size 16384 diff --git a/layers/decoder_4_cross_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_4_cross_block_mlp_w_in.packed_weight.u8.bin index b1149f85fb281afbffc9cc5fb3dac01ecd62e203..2161ddd2864d4c38592661f8f2d53b440770ca06 100644 --- a/layers/decoder_4_cross_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_4_cross_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0ee380e03abaa8eb75539e908a009a2c0fab2af231ebf9c77ccd8bea01625563 +oid sha256:a0489721b293b3ca1fcdf662c044237b0ae07aa9ae460fbd66d6e4d4edd68b50 size 655360 diff --git a/layers/decoder_4_cross_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_4_cross_block_mlp_w_in.scale_values.f32.bin index 56e7f0b8fd1117ea58f6e3138237522b821d3341..564f0e322d7a86c09fdd5f8d1f268ce429a516f4 100644 --- a/layers/decoder_4_cross_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_4_cross_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ca2393d1d6cfc924d3705620afae401da0a1057cb70a627a762862d880e4dc57 +oid sha256:a877c0e3d34e4de0a55784c90a53c41193d06d932cf356643e0c9c39bbd877d9 size 4 diff --git a/layers/decoder_4_cross_block_mlp_w_out.bias.f32.bin b/layers/decoder_4_cross_block_mlp_w_out.bias.f32.bin index 2ae3fbe5ef2b061df38a67073a7f0e9e7b5c4344..fed1ee22ce90b8c50b162f8104b5d47b2c32b0e5 100644 --- a/layers/decoder_4_cross_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_4_cross_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7e2f8fa91fd415e7df8c55898beae2a32c79635c3f3e14d7f474dc27d7fe7e5e +oid sha256:c4706434e5600143b8000b42086e5876cd70ee3f705c9b6f660650e61e6704e0 size 2560 diff --git a/layers/decoder_4_cross_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_4_cross_block_mlp_w_out.packed_weight.u8.bin index b7afec30a449e776e8828426beff405237d7ef1c..7d108b5fab00e8169e44da4ee2869ec660e36634 100644 --- a/layers/decoder_4_cross_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_4_cross_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6ac53ae9a8d1b549675b173632028543b73aee8bdeb52165739a5dfb8e01dcde +oid sha256:f902606d6093a73f74866075bc990c9b1fa21f5ac3918d82d52531a6e6b27dd1 size 327680 diff --git a/layers/decoder_4_cross_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_4_cross_block_mlp_w_out.scale_values.f32.bin index abed75136bfc16c147d01a3ee865d44b9eb464dc..7edacd01392c1ff0350dfd39108148fe323f3601 100644 --- a/layers/decoder_4_cross_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_4_cross_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:17a1ad12c4a297e3333fd1a00dc1afe0651cc68e2f927a9c92358990a400794a +oid sha256:5ad60db274db1cfe4f344945fc6a354a9a75fb2666c99b8d13a85eee28be1b57 size 4 diff --git a/layers/decoder_4_self_attn_block_attn_w_k.packed_weight.u8.bin b/layers/decoder_4_self_attn_block_attn_w_k.packed_weight.u8.bin index 658f9de3fd11c2c46d611570f2e8149892d7c556..0cce86d6ca4aec15d0d91eafc18dfc03fc3bcbcb 100644 --- a/layers/decoder_4_self_attn_block_attn_w_k.packed_weight.u8.bin +++ b/layers/decoder_4_self_attn_block_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1a6452884ccdc02ec802da82f200c4a80aa1e2b090849decc9b51230e621e812 +oid sha256:e300586d5091990a15d12e681e43cfa4a00af31f8a6f886e446f770e7c554271 size 102400 diff --git a/layers/decoder_4_self_attn_block_attn_w_k.scale_values.f32.bin b/layers/decoder_4_self_attn_block_attn_w_k.scale_values.f32.bin index d64b88187cf5446a8e12e316322e81175d1722d9..0fcc0e72f4e16aaddfa8d2a6390783eb104b0b8e 100644 --- a/layers/decoder_4_self_attn_block_attn_w_k.scale_values.f32.bin +++ b/layers/decoder_4_self_attn_block_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f3d67151d91e46353e8674137bdfcd58cc7c68ba8effcf87a6d0e4539183dd63 +oid sha256:b27f63a35dc17e8b23a4dbe85408fd3350d5083c9c8312fd18ff16345eac0a84 size 4 diff --git a/layers/decoder_4_self_attn_block_attn_w_o.packed_weight.u8.bin b/layers/decoder_4_self_attn_block_attn_w_o.packed_weight.u8.bin index cfa33a9daca13a2e585716a9936988c65ec35d7f..a578b969ebec6ce55c33b38a7734fbad5fb4cb41 100644 --- a/layers/decoder_4_self_attn_block_attn_w_o.packed_weight.u8.bin +++ b/layers/decoder_4_self_attn_block_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:abac573fcfcb72212c55adb43bc1db1967e7e78a374ec940eb6c4f5d635ea06d +oid sha256:5373c29c4a939b97eeb54207b6c441a0fead033399cb00e36beea3dbf941bac2 size 102400 diff --git a/layers/decoder_4_self_attn_block_attn_w_o.scale_values.f32.bin b/layers/decoder_4_self_attn_block_attn_w_o.scale_values.f32.bin index ff0f568f8856d5a1c33f5c9fd93778239bb317e0..c7b7856010476c25445c6ea82e22159bf72f21ad 100644 --- a/layers/decoder_4_self_attn_block_attn_w_o.scale_values.f32.bin +++ b/layers/decoder_4_self_attn_block_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c6799bb383071e94dfadf6573f0416870ef323ebeb31e87626ed137e44c98c6c +oid sha256:3d1728382c159072d32f88230a61708e950d6ff133929cd12dea8121d83071c9 size 4 diff --git a/layers/decoder_4_self_attn_block_attn_w_q.packed_weight.u8.bin b/layers/decoder_4_self_attn_block_attn_w_q.packed_weight.u8.bin index 846c09e6da30afd3c9290fdeeb49978d9015c95b..8f3a799352dd33f37dc484e5f65b34b5068f479c 100644 --- a/layers/decoder_4_self_attn_block_attn_w_q.packed_weight.u8.bin +++ b/layers/decoder_4_self_attn_block_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b6abce78b00434b9b260f5dc37b7b7367830778dbceebd3a9d6f8527f9c99d86 +oid sha256:45826f137d54cbb649e5c6ae6dea1810936c192577dad65f1e7a847984a81004 size 102400 diff --git a/layers/decoder_4_self_attn_block_attn_w_q.scale_values.f32.bin b/layers/decoder_4_self_attn_block_attn_w_q.scale_values.f32.bin index 1c78c3a5e80443d393ef388b24c1e4afec630503..04381591d65803b0351b6d521f5977baceaa8092 100644 --- a/layers/decoder_4_self_attn_block_attn_w_q.scale_values.f32.bin +++ b/layers/decoder_4_self_attn_block_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:666df0214bb1e28eb5f382b2b12181fcdf9befbac704d819b8c60fd9afa91a1a +oid sha256:33bccb48e0d40c9dc8eb90a23cd8c427e7824f1c930fe20d90589cda3f5bb030 size 4 diff --git a/layers/decoder_4_self_attn_block_attn_w_v.packed_weight.u8.bin b/layers/decoder_4_self_attn_block_attn_w_v.packed_weight.u8.bin index c5cf4dcc92c7efe004868d13d2ac7891cabde720..9e46417aac8944f8ae5027c4c2d03f45c273931d 100644 --- a/layers/decoder_4_self_attn_block_attn_w_v.packed_weight.u8.bin +++ b/layers/decoder_4_self_attn_block_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:be998d5ab45cd4790a8c69a33479b59f65f938618ab7e8fbd56a7b19ff9abfad +oid sha256:8331e844e9535e0c325edd19e161c13edde32ae663380da09025993cdea60422 size 102400 diff --git a/layers/decoder_4_self_attn_block_attn_w_v.scale_values.f32.bin b/layers/decoder_4_self_attn_block_attn_w_v.scale_values.f32.bin index 762536fefcb9491076295fe0cf2440d7b46f7637..07e607db2e91b409ac8e7a88eef9015716ca0f6d 100644 --- a/layers/decoder_4_self_attn_block_attn_w_v.scale_values.f32.bin +++ b/layers/decoder_4_self_attn_block_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4f5578ec265f37dc898731cb72c748c24e3e480a64d5788c1815617687d3fb24 +oid sha256:2d4fb5a2384b1b4bb2f482db3ec538d363a09e046dbd54e882bf784c6a5c08f4 size 4 diff --git a/layers/decoder_4_self_attn_block_mlp_w_in.bias.f32.bin b/layers/decoder_4_self_attn_block_mlp_w_in.bias.f32.bin index 41dbc43cb9c6291cb5a0d5f5fb1e736be47c0de6..e85e593b32b6a046f79c23e207597f484f35d1b7 100644 --- a/layers/decoder_4_self_attn_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_4_self_attn_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e836b2102f7f826f339bc7b014e07782d3a748c773f10ba3b01b940d29b44182 +oid sha256:58cb7e7aec507f1957187d6fed32241c60b2b5d26382faf9ae0a6bb6107ca974 size 16384 diff --git a/layers/decoder_4_self_attn_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_4_self_attn_block_mlp_w_in.packed_weight.u8.bin index c7c920bb807893ee63476cb8d1ac461ecf0ae65b..3172803c97fdd90d289abda70bb31a30145d6275 100644 --- a/layers/decoder_4_self_attn_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_4_self_attn_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ee9a82a04d0e4459c4cb7f94c28d2686ddae16e6668738edfa76cd8a013666ae +oid sha256:870916449e436f9e60f60ea3e12f3435e863dbc0becf7b04705ce6f03206a44d size 655360 diff --git a/layers/decoder_4_self_attn_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_4_self_attn_block_mlp_w_in.scale_values.f32.bin index 1f9c6ecc47b8341f329d9765104f446fb870b0e2..0411b385f949f5fef8ad70e85da6fb813807b973 100644 --- a/layers/decoder_4_self_attn_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_4_self_attn_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:65639fae837d12338698909216342b9da9ebbc2c75d3058b73fe5b3d8e342350 +oid sha256:2e4e7df77ff5c2e5cf71328c80f8ec401a6f624e683790badd0b7aae32da3c2f size 4 diff --git a/layers/decoder_4_self_attn_block_mlp_w_out.bias.f32.bin b/layers/decoder_4_self_attn_block_mlp_w_out.bias.f32.bin index c2c052ea42dcfd1d0956967b586665e2b0777f03..88a896d15a3e6bbdfac89ac496bb4f3c6897bb71 100644 --- a/layers/decoder_4_self_attn_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_4_self_attn_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ce15af4c19781b8525971868cc9fb94e220f1867242fa7faa61242529661471e +oid sha256:e39e3873069fd6a675cfc178936887e12f6aa51d658b846ba25a978b9cabf735 size 2560 diff --git a/layers/decoder_4_self_attn_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_4_self_attn_block_mlp_w_out.packed_weight.u8.bin index f6f0cbeeb511858e8328a18935ab90f90eaf5bb9..30c9b09bbef65642270a0ad98195cdcf32a6cc17 100644 --- a/layers/decoder_4_self_attn_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_4_self_attn_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6aa023b652ea8cb4c15cda43b758697397951ca79dfef5767f4bd1e0da99ecdc +oid sha256:0d20e20a86bc772bda2b92d98747d3711be44c4d86cbca7c3984026cb346dbc6 size 327680 diff --git a/layers/decoder_4_self_attn_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_4_self_attn_block_mlp_w_out.scale_values.f32.bin index 52773e687303fbcad086e5ec73ec1076ee98484c..10d943234d5b1a01d71135081bc6b056847c6633 100644 --- a/layers/decoder_4_self_attn_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_4_self_attn_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:20b79d91f90bd50129605b252e0a23dcb120666afac4e988e997b4cd6496a4d1 +oid sha256:91a69820c780a5812087ade3eee56f8fa3fd4ecb49c52fbc788ebf537cd87df8 size 4 diff --git a/layers/decoder_5_cross_block_cross_w_k.packed_weight.u8.bin b/layers/decoder_5_cross_block_cross_w_k.packed_weight.u8.bin index 03919fb5b2b7d39764ea610efeb189f46381e170..8970393d39fe6090a0adb89bae1aac20dc3878e2 100644 --- a/layers/decoder_5_cross_block_cross_w_k.packed_weight.u8.bin +++ b/layers/decoder_5_cross_block_cross_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2421fa0bcf4fb2ff3e2faf11d960666dba196f5265ac3c0c07205ec7e2188589 +oid sha256:f24322858b2d972eea75e282e3a7a48c77cbcad77e8bd6de7e01e15dedf32329 size 102400 diff --git a/layers/decoder_5_cross_block_cross_w_k.scale_values.f32.bin b/layers/decoder_5_cross_block_cross_w_k.scale_values.f32.bin index 54e07738532849ad0941fd305ac5e1f420c33dd7..179c7dfeacc16d80b4e0b15f72e8205789edaa40 100644 --- a/layers/decoder_5_cross_block_cross_w_k.scale_values.f32.bin +++ b/layers/decoder_5_cross_block_cross_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a6e13b8b98f8f3a56588c424d0f0eeb2d97ee80fcdf8391d94e81fd0b041ea63 +oid sha256:6e9a8bfc36c2e35971e6976656299647b36e4a24e164890b98bcc4e70110e76d size 4 diff --git a/layers/decoder_5_cross_block_cross_w_o.packed_weight.u8.bin b/layers/decoder_5_cross_block_cross_w_o.packed_weight.u8.bin index 60a9b71e8da9ecd2076d4561d8a85b09f6c98b93..f7172722f62c2a925def69e9a39c0b4d891e4f0b 100644 --- a/layers/decoder_5_cross_block_cross_w_o.packed_weight.u8.bin +++ b/layers/decoder_5_cross_block_cross_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:beab9c7f54cfb1f245c0860f6fe4a8e1cf07b68ccf2100119184d157905e6e0a +oid sha256:8925a3109acfe4a65b89a643b38a980440ad8000565dbcd68fd8d9128091965a size 102400 diff --git a/layers/decoder_5_cross_block_cross_w_o.scale_values.f32.bin b/layers/decoder_5_cross_block_cross_w_o.scale_values.f32.bin index 2b3af0a8a0a47efc65568b96abf3c69a73f4ef7e..b7cbb58fa3aa7cfa551794a72d7a0a8785ba1775 100644 --- a/layers/decoder_5_cross_block_cross_w_o.scale_values.f32.bin +++ b/layers/decoder_5_cross_block_cross_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2b8adf007a2bddfd616002af4fddddac73e836196ce335a5fbae84bc40f3b7de +oid sha256:6d7e412565361ac5fc632c4531b71b650dcc98ed6614078fb82db77a0fbaf7c7 size 4 diff --git a/layers/decoder_5_cross_block_cross_w_q.packed_weight.u8.bin b/layers/decoder_5_cross_block_cross_w_q.packed_weight.u8.bin index 8381ba9b8239620e79dfef7db9e5c316443b6a88..14a09f029855411e26fc9329583bad5f41bc48a8 100644 --- a/layers/decoder_5_cross_block_cross_w_q.packed_weight.u8.bin +++ b/layers/decoder_5_cross_block_cross_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:210c10daa667e6479481d6d3ba2f0ef98b5a7e3f0bd9e853f61937c966a5663e +oid sha256:0d27485165aa65ac9c0302c40afb801f24550eb5e02761361021024fa58aa45d size 102400 diff --git a/layers/decoder_5_cross_block_cross_w_q.scale_values.f32.bin b/layers/decoder_5_cross_block_cross_w_q.scale_values.f32.bin index c22df37bdbb2804f4a5f7a6fcb00416e8dfcc552..1c5b93d01ebcb0c0978feb1b6312f780e8075802 100644 --- a/layers/decoder_5_cross_block_cross_w_q.scale_values.f32.bin +++ b/layers/decoder_5_cross_block_cross_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:63743e12bc6c750bb6ff44b421e2eb455acc1f894b52d27c31a9db927da15569 +oid sha256:d3aa0d2be93667164d611db40a95d945427af758e978c9f51df73d98e33a65ab size 4 diff --git a/layers/decoder_5_cross_block_cross_w_v.packed_weight.u8.bin b/layers/decoder_5_cross_block_cross_w_v.packed_weight.u8.bin index e018ca3b3412aac6bacf8546b61361d2c2716941..74e22ae847641a2d59845447f3eb483443ace955 100644 --- a/layers/decoder_5_cross_block_cross_w_v.packed_weight.u8.bin +++ b/layers/decoder_5_cross_block_cross_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e99e62d118e9ee188448b44590afb392c48a14422a7087ebe14fad5f1ffcbbd4 +oid sha256:0252a685fc4582f57ae143d51ce3fb8973e098e24c9978a920e2d33fa4d59e98 size 102400 diff --git a/layers/decoder_5_cross_block_cross_w_v.scale_values.f32.bin b/layers/decoder_5_cross_block_cross_w_v.scale_values.f32.bin index 30ad8d1bdc47bcc0ef24971a4c878f2b1968de48..fb2c5b69bf53342b9042023c835fd4b4404c96c2 100644 --- a/layers/decoder_5_cross_block_cross_w_v.scale_values.f32.bin +++ b/layers/decoder_5_cross_block_cross_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d031e5ab601acfeebe4a5f573155fd552b2f9ddd44bc9920b6748d3915704fd5 +oid sha256:cf740bd129cdac2d57821e98aa6b0589bf055d31c0b0e7a8ec7109191d803e08 size 4 diff --git a/layers/decoder_5_cross_block_mlp_w_in.bias.f32.bin b/layers/decoder_5_cross_block_mlp_w_in.bias.f32.bin index 1529aaa3e8ae48e537ffc71acfb5f88654913b77..1ab280c1e9f8d6d93b7a738aea22351ebba3aa5c 100644 --- a/layers/decoder_5_cross_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_5_cross_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2f895fa89f658cf7074483d010ffe6c7e8fe79e24c939268b27b8ae0c5a38415 +oid sha256:178e819216d729a089888c37140a99b1337d1b8866b2ca2a3772bbfa80d8384d size 16384 diff --git a/layers/decoder_5_cross_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_5_cross_block_mlp_w_in.packed_weight.u8.bin index 1f586bf3818bb28de9a29a14300be91a6d6b3c26..b84c176e700afcf39bbe5e58895290b5932006a7 100644 --- a/layers/decoder_5_cross_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_5_cross_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:41304fecf261465ff3847dbdee49472009d2a3262b8dbf7fecf31ad0854dc5b1 +oid sha256:1098e01a4c56b23c62db470d2def0e876e78074521a6f26fe101b323ef914b8c size 655360 diff --git a/layers/decoder_5_cross_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_5_cross_block_mlp_w_in.scale_values.f32.bin index 3faaff067c2acd5675cd055bb96e02536c47ff73..f12f3d860bbedd809771db155c8c8ee7fdecb1db 100644 --- a/layers/decoder_5_cross_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_5_cross_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c347d522ec28f95a2e57dde268763d465598af66efe957ecd9250e87f8cd85a9 +oid sha256:689b925a8e9594e32ed35cca127e7146ab7c932b50f31091455c2ffef93ab574 size 4 diff --git a/layers/decoder_5_cross_block_mlp_w_out.bias.f32.bin b/layers/decoder_5_cross_block_mlp_w_out.bias.f32.bin index b522d78bb5297ad3632efdb7cfb0cd2944e6d298..d05f0541ad9427bcf21cf0550b897b33c53f4168 100644 --- a/layers/decoder_5_cross_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_5_cross_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9bf3661e4bb1f05bb419ff26865cda4d421d7abd79d47205791194e1807ef461 +oid sha256:05d28eff762fb39a07cb0f87dc407b08eb966482efca2d63556b1803eacfd613 size 2560 diff --git a/layers/decoder_5_cross_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_5_cross_block_mlp_w_out.packed_weight.u8.bin index faac8088fd473e2cf91c15d4a7346b627b98992d..e9ecd8e9319e75c38b7c19d1ef0ae00ea9ca779f 100644 --- a/layers/decoder_5_cross_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_5_cross_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:90ae1df6b88f5d3a90f4c345eb78be91c4aa0879c80360b5c3da63ac2f2ea568 +oid sha256:02b49be34e4473aaa3a36f63004abd08395cdfa30c78f79f1aa8ecad314f6e3c size 327680 diff --git a/layers/decoder_5_cross_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_5_cross_block_mlp_w_out.scale_values.f32.bin index 8de468c3132a048a683d04fb0e2ca96266082028..f323a10d93b6b0b0fb40fda30d64b2cc871bde12 100644 --- a/layers/decoder_5_cross_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_5_cross_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c0ee1efb333a2d1fffc03499ffd31475c523a2f72a1bafc7adff7481cd6bb559 +oid sha256:51beffefd5a05dc7fb21d6f8fe7e22f4fe5ccb9e91f1038a829865d23820786e size 4 diff --git a/layers/decoder_5_self_attn_block_attn_w_k.packed_weight.u8.bin b/layers/decoder_5_self_attn_block_attn_w_k.packed_weight.u8.bin index 7fb3a6b8628a0590c2d099088902732829c81bef..4d16c5dc094b9e80928facd7f9687d2b6d10830c 100644 --- a/layers/decoder_5_self_attn_block_attn_w_k.packed_weight.u8.bin +++ b/layers/decoder_5_self_attn_block_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:168f0686219feabfd7985ae44027f4b62a75a7031d4795d7098ce9d02c251032 +oid sha256:bce33f116822eae9b8b4722529395182e463aad001e3a79d16808be7b00dbe19 size 102400 diff --git a/layers/decoder_5_self_attn_block_attn_w_k.scale_values.f32.bin b/layers/decoder_5_self_attn_block_attn_w_k.scale_values.f32.bin index be6988e7f0442be989c2c992105fba913bed415f..712dfb53db8d71f42fdd35ab6a04f54e098c74f2 100644 --- a/layers/decoder_5_self_attn_block_attn_w_k.scale_values.f32.bin +++ b/layers/decoder_5_self_attn_block_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:342fa912e6c7400ed8ea8b18c411f406a024ee0698026e1b25641814b7278261 +oid sha256:d803f9f462591e86f4ab0c448526fd033b3f461206d329cfeb14261ae12d77de size 4 diff --git a/layers/decoder_5_self_attn_block_attn_w_o.packed_weight.u8.bin b/layers/decoder_5_self_attn_block_attn_w_o.packed_weight.u8.bin index eef91612cd54d4e571d33608d029e820201e441c..5f3894e648adde06d30962c22fc47626262d94ce 100644 --- a/layers/decoder_5_self_attn_block_attn_w_o.packed_weight.u8.bin +++ b/layers/decoder_5_self_attn_block_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b22c7b2bcb868951760cab5ad05607942978b83f1f54e50269dd2a894b292ee4 +oid sha256:0bcad956e60d87582886abe3873b73c31c6421dccd07ee572bc3ebaef8b93c5f size 102400 diff --git a/layers/decoder_5_self_attn_block_attn_w_o.scale_values.f32.bin b/layers/decoder_5_self_attn_block_attn_w_o.scale_values.f32.bin index dd09ddac71aaa9f35cd7451b841a6f25dced2e4b..614d45147b5a0047b354d85f235fdf4130abf8ce 100644 --- a/layers/decoder_5_self_attn_block_attn_w_o.scale_values.f32.bin +++ b/layers/decoder_5_self_attn_block_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1cb27fec2c7867c8c1ebc9ae311f80dd146d9d35536fcf71fbb63e38a4fce3b4 +oid sha256:6558f786b4707e9a74cf3b309288f44bab2fe85d7c2bf63d8191ce5d7717523a size 4 diff --git a/layers/decoder_5_self_attn_block_attn_w_q.packed_weight.u8.bin b/layers/decoder_5_self_attn_block_attn_w_q.packed_weight.u8.bin index b1c91c223f3228782e685c7e62ff2ebbf2037ffd..b0f227656d47bfca0ab0a2787f3829302a84b7ae 100644 --- a/layers/decoder_5_self_attn_block_attn_w_q.packed_weight.u8.bin +++ b/layers/decoder_5_self_attn_block_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d15bdb5385f8931d59f913e96be21e5521149624139ef72e734f73d61af53c2f +oid sha256:63ac0aaab6fe41d627f6cc07bb5e3441fe952761555f12f828a71b26612694b0 size 102400 diff --git a/layers/decoder_5_self_attn_block_attn_w_q.scale_values.f32.bin b/layers/decoder_5_self_attn_block_attn_w_q.scale_values.f32.bin index 46fb71aa861b7668ca122a9b092d5faf0a1d04ec..417d14c4809236cd526c40e84521d2f2ea9e0f1b 100644 --- a/layers/decoder_5_self_attn_block_attn_w_q.scale_values.f32.bin +++ b/layers/decoder_5_self_attn_block_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0217589c56e8bb040880aa2ce7ebdc3ac5f250b12b8a11787a253143634b5bac +oid sha256:3bacc7a7c0e98bfaaf14ba92c4287fdc929b5abc536607a4ac005d7f3c9fc06f size 4 diff --git a/layers/decoder_5_self_attn_block_attn_w_v.packed_weight.u8.bin b/layers/decoder_5_self_attn_block_attn_w_v.packed_weight.u8.bin index 909c74b1ce7af342daeccb8b7c39bb4a63c1319c..65bdef2f71ef0b7e925de83f36d921c8f64ec97d 100644 --- a/layers/decoder_5_self_attn_block_attn_w_v.packed_weight.u8.bin +++ b/layers/decoder_5_self_attn_block_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d1ee78fe8bdf9a01d8f82e6a22aa1e182407d7d4670a87d5e21bf2a34fe442d3 +oid sha256:a3207da1809eaa7cd2cdb75e16ee500c93759b4dd5e45c39ca8f239312fb50c8 size 102400 diff --git a/layers/decoder_5_self_attn_block_attn_w_v.scale_values.f32.bin b/layers/decoder_5_self_attn_block_attn_w_v.scale_values.f32.bin index d177a83c7fc07d9a7000b817c0b8e49adeccc7b5..3755b2d8222e761799922adf95ff3f77b3a33216 100644 --- a/layers/decoder_5_self_attn_block_attn_w_v.scale_values.f32.bin +++ b/layers/decoder_5_self_attn_block_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e38daff351bac7c1f9b9a4f7295119cb303c7037e12027fb8a36effbdec8190d +oid sha256:d6a96d8269d69aed28e0b1e4bac833243793b2979d819ea9e307efa2868925c7 size 4 diff --git a/layers/decoder_5_self_attn_block_mlp_w_in.bias.f32.bin b/layers/decoder_5_self_attn_block_mlp_w_in.bias.f32.bin index 484f6bd56f24ea15529384ebdb4e21a442dc67fb..22d753b55db35a8bf5730e8e8923b2e2b5ce908b 100644 --- a/layers/decoder_5_self_attn_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_5_self_attn_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7758b963a9e36525d1d6d49027aeab3647ca6c3b9a60dce81d38ac5cd041fbdb +oid sha256:5fbdd191cb5c5b15dd436bb0eb61d75f4dd1ffcb139d867e7ec1362a6f698d78 size 16384 diff --git a/layers/decoder_5_self_attn_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_5_self_attn_block_mlp_w_in.packed_weight.u8.bin index 83cfba231ffc922efa172b8cf64c3dd8afce5a5c..832a9a421d490be70771bf56cd26d611c07e35a2 100644 --- a/layers/decoder_5_self_attn_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_5_self_attn_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ca50cff4086a68e7b381928637256fbafa7ab0b4d7e7db18c98ff7bd58424879 +oid sha256:324d5b0baa2bd143549f6b876e4847bfb14df87e6f4c5f2ed8c38f80f7a1bd60 size 655360 diff --git a/layers/decoder_5_self_attn_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_5_self_attn_block_mlp_w_in.scale_values.f32.bin index a2b3898406936a6bab8a6113db01cabc08abdcbf..a581104adeee335f533f51d0cc949cd2881e65cd 100644 --- a/layers/decoder_5_self_attn_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_5_self_attn_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b34e67e0bd1804287bd6304f8909fbcabca41c8e33148de56b51cd82bab0de62 +oid sha256:a981bf8cfaae486dd857b1fc89be565b3858c02e7fd79d6213ff125ca715fe5b size 4 diff --git a/layers/decoder_5_self_attn_block_mlp_w_out.bias.f32.bin b/layers/decoder_5_self_attn_block_mlp_w_out.bias.f32.bin index a7e80782f7b8d3536adc4fc59b028722a883533d..73862cfcdec0537eb11ba932b35f45de51047bf7 100644 --- a/layers/decoder_5_self_attn_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_5_self_attn_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b280eafca25a670d2e9f3ea5fee996077207399ced3a43dab27b982a316bb5c3 +oid sha256:c8d46fdf1ddf2b1b8aaecabaa8e43068f74bb265db62ec27e7203ef055f8d3d3 size 2560 diff --git a/layers/decoder_5_self_attn_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_5_self_attn_block_mlp_w_out.packed_weight.u8.bin index ef1f6f1c258042243a67c2d73f03fed88637a3e1..9d0acdbf898f0fa7396eea1bd867054ae7a4a07c 100644 --- a/layers/decoder_5_self_attn_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_5_self_attn_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a1bb7afec833a278d841fef92fa2aa4144638247087fbcab89f9a664dbd16013 +oid sha256:d11e2e2807b998655988a6994f40b12f1147bfcb09e1d212a6ceddf86a8b9d70 size 327680 diff --git a/layers/decoder_5_self_attn_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_5_self_attn_block_mlp_w_out.scale_values.f32.bin index 42fe92339cf1af1178f897650f1e8af7e07eb427..b81396f92e7b5e6537297aa2e412b3078d2c114e 100644 --- a/layers/decoder_5_self_attn_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_5_self_attn_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:92b557a7c755ee619d71c405bafc0e40db3d479fe5a6c9bdb7379d5f212e6904 +oid sha256:9d419ffd1604b3adb24e2f51c7707ad3bb3865beee1f25bf19e584c09768b3f9 size 4 diff --git a/layers/encoder_0_attn_w_k.packed_weight.u8.bin b/layers/encoder_0_attn_w_k.packed_weight.u8.bin index 62e53bbe33dcc9aaf59df80b874fe4679ca7c60b..8f3b423d761e0c3db15e146655c3d68183ee4101 100644 --- a/layers/encoder_0_attn_w_k.packed_weight.u8.bin +++ b/layers/encoder_0_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2f63ce5b91036dd26a20804e19e3fbddb0ce8195855c9e802e16b4159806e016 +oid sha256:0d358351e42a919e6f41efc8d3d8220d202c7a2592a36b18b1e4039c0312c49d size 102400 diff --git a/layers/encoder_0_attn_w_k.scale_values.f32.bin b/layers/encoder_0_attn_w_k.scale_values.f32.bin index 563d75734f39c52244220e5bc1869218dfd356b7..3de43f1952844bb84ee9816cc53603efdd46a457 100644 --- a/layers/encoder_0_attn_w_k.scale_values.f32.bin +++ b/layers/encoder_0_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d8473447ad8c185def4c9c3ff9c2d9d3eea1870c01697de407ffd7f06271127d +oid sha256:363a2535ff463d2406751ad619b676aaf8f5043f972b10829d70e5c5370541e4 size 4 diff --git a/layers/encoder_0_attn_w_o.packed_weight.u8.bin b/layers/encoder_0_attn_w_o.packed_weight.u8.bin index ac8e40c950cac439d58fda6de06d59daf8d7e983..32a9b9c7f0841c180d5cd02ee95f1c7044a018b0 100644 --- a/layers/encoder_0_attn_w_o.packed_weight.u8.bin +++ b/layers/encoder_0_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e68c975be66010affb7679586381681af5d449d90380aa8333bf01ce8c266c39 +oid sha256:83c19e24982850a0703bc51352e8d2dcf2d9c58cac17c3fb58815327b0117251 size 102400 diff --git a/layers/encoder_0_attn_w_o.scale_values.f32.bin b/layers/encoder_0_attn_w_o.scale_values.f32.bin index 59e782a86988a05850ef46ae1747b726c2b73d5c..ca77e93d137926244e618da59bdd3524f8b81537 100644 --- a/layers/encoder_0_attn_w_o.scale_values.f32.bin +++ b/layers/encoder_0_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:29c8b68c8c6d1ed6f90d6e01800fa4da76dface1f032e86f807e07e6ce500150 +oid sha256:92e6c93ca7bf5dfca57fdc636156023c476dba44daa150855c770b191b2812d0 size 4 diff --git a/layers/encoder_0_attn_w_q.packed_weight.u8.bin b/layers/encoder_0_attn_w_q.packed_weight.u8.bin index dfb29f121e0e1453be9f3a6e71c358482cc70cb8..407c189ecfda62da8e5c9a963e5bc4e4930bccad 100644 --- a/layers/encoder_0_attn_w_q.packed_weight.u8.bin +++ b/layers/encoder_0_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f2eb1c46f31e66c4514bf852f88b348e101f0c5d590930219cf0dc628d206476 +oid sha256:951c976f47b39ba620a2703f97b02ed8e753ccd8bb95a9c61ed0911139dd9009 size 102400 diff --git a/layers/encoder_0_attn_w_q.scale_values.f32.bin b/layers/encoder_0_attn_w_q.scale_values.f32.bin index 7146ca6406aeb381527ddd2205c08cfc0f5ab9f6..41703350a4f30bc5604f9e9327cf4f77bb7928e0 100644 --- a/layers/encoder_0_attn_w_q.scale_values.f32.bin +++ b/layers/encoder_0_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1b78ea9eedffdde48507aa32fda72ce0017963541a013b187aceb94fa9e221a4 +oid sha256:58f656d894a6673181860f8ec88093f0a6254b00ce39b1cb1e108f1615e638ab size 4 diff --git a/layers/encoder_0_attn_w_v.packed_weight.u8.bin b/layers/encoder_0_attn_w_v.packed_weight.u8.bin index d30ff4b667d173841be5ac5a611c3d44d3cfae87..5eaeed3f134d620ed27227299e63407b97918e4f 100644 --- a/layers/encoder_0_attn_w_v.packed_weight.u8.bin +++ b/layers/encoder_0_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:11bc624dbf8bd0c250e711eaa29632f9d3348f21c9b3c9d993c908a2476a0d48 +oid sha256:5f2fd0f6297addda94dfd003cc2902fbce3b926e9d3ccb9fbf56f118ba987bc8 size 102400 diff --git a/layers/encoder_0_attn_w_v.scale_values.f32.bin b/layers/encoder_0_attn_w_v.scale_values.f32.bin index 8200468ceb2162e4de99f5abfd9b80d2458f6df1..25372cd53fa79954dcb28ffdc0ca963dcd4ea49f 100644 --- a/layers/encoder_0_attn_w_v.scale_values.f32.bin +++ b/layers/encoder_0_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:126404b59d4db50a3fb6fbfb0cd22a8ad394b3a2181ba9f0f189443d7560db56 +oid sha256:834cb863484c883b449cc141b0d11a1441c8d5d4c6c00b76092e54b1b9726ffd size 4 diff --git a/layers/encoder_0_mlp_w_in.bias.f32.bin b/layers/encoder_0_mlp_w_in.bias.f32.bin index 7d2bb1eb14132c4d461e09099a3f9948bf73ecd5..ead6960de9171ec5fae21b03b26f1ea5257adcff 100644 --- a/layers/encoder_0_mlp_w_in.bias.f32.bin +++ b/layers/encoder_0_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:73208703f263f727756bd48cbd994daa526006f49f7a0b5081f0fec0390c6262 +oid sha256:3a2cab48442eaf53044fbe153c8e3688fdd3ec3c035f8edeeaf67d3bcddaf4ff size 16384 diff --git a/layers/encoder_0_mlp_w_in.packed_weight.u8.bin b/layers/encoder_0_mlp_w_in.packed_weight.u8.bin index 6fde33a98886b41e27d3163ad6645b01f69383fb..674fa3acf782c8c9f2b0ae9df6ba757a5693c249 100644 --- a/layers/encoder_0_mlp_w_in.packed_weight.u8.bin +++ b/layers/encoder_0_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7ab9b1aebe99f1dd0c8c67488d9d137e540f1e11c6b5b8bad401c1ea126ce834 +oid sha256:8084c90cad779fcfbf3a68dd3d751dab75a495d6798f8d125b67ee076582c72a size 655360 diff --git a/layers/encoder_0_mlp_w_in.scale_values.f32.bin b/layers/encoder_0_mlp_w_in.scale_values.f32.bin index 11e38f5c0ccf629d1022fb4d8c40be505d2aa35a..02c1c819a6ad7e2fcca6b7dd8d1dd8e28ec4e422 100644 --- a/layers/encoder_0_mlp_w_in.scale_values.f32.bin +++ b/layers/encoder_0_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:77cc54c25fc58c33ae5ac086bc2f27f02eac61df14eceac3e8a03410bad8b7f2 +oid sha256:fc25f4d74c3d8a0be61dd9b7b006c93e806bc6dc048c05e98596e8542c1327c8 size 4 diff --git a/layers/encoder_0_mlp_w_out.bias.f32.bin b/layers/encoder_0_mlp_w_out.bias.f32.bin index 0f54bd6dfe02021d8dacb70ed36f87609ea3f662..527e989d1ef91566d8c228d161341c0c2c446b25 100644 --- a/layers/encoder_0_mlp_w_out.bias.f32.bin +++ b/layers/encoder_0_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ed49c800405f2b13ac01856aed66154cd2e1aa6405de541986706eecb22af8d3 +oid sha256:6d95b0054d8d8c155e33665b1fb3c0dd454478ad2a95eba4316160883bdefd47 size 2560 diff --git a/layers/encoder_0_mlp_w_out.packed_weight.u8.bin b/layers/encoder_0_mlp_w_out.packed_weight.u8.bin index 9231de808d5251b63ce83bca98cde08d7a107fae..1eb16bb162078c0bb7e09a0459bca264ca14790b 100644 --- a/layers/encoder_0_mlp_w_out.packed_weight.u8.bin +++ b/layers/encoder_0_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4b0d77b5c3e1e79d71ff659e164425aecde16daa9e9a480ab3b8ca044e5bcad5 +oid sha256:2b475a637893e79948117383cd9138d44690a04653e49985b355e6e63693a783 size 327680 diff --git a/layers/encoder_0_mlp_w_out.scale_values.f32.bin b/layers/encoder_0_mlp_w_out.scale_values.f32.bin index d6aad66ace7aff98ab21187a6992d6dc9f8fe22b..45d2f02ce80d6ec51eeb85f00c39c315907dc5de 100644 --- a/layers/encoder_0_mlp_w_out.scale_values.f32.bin +++ b/layers/encoder_0_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9e53add4a0b7ab6184f4c36e38a5931859ecc3549c4c5de76131356cfb8b70ec +oid sha256:827241212e161c00a58bf08aeb8e001a475599cfb6786c2945b15dc39afe3dc7 size 4 diff --git a/layers/encoder_1_attn_w_k.packed_weight.u8.bin b/layers/encoder_1_attn_w_k.packed_weight.u8.bin index 37e0fb13443ad286144b3faf95c0ab6c3f01797d..59fe38d9c74b082bc5a522f1457d54fcf7da91f0 100644 --- a/layers/encoder_1_attn_w_k.packed_weight.u8.bin +++ b/layers/encoder_1_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a94892001dbbde4f76f2bb974e8e5f1b016c8a1c7bedb4fa599e6d98e6a3f862 +oid sha256:27b7e94565efaf4b3c1518f3862c56328a9e2ecb594cdd76f52e8ecd87cbaeb2 size 102400 diff --git a/layers/encoder_1_attn_w_k.scale_values.f32.bin b/layers/encoder_1_attn_w_k.scale_values.f32.bin index 7ba1cc30999f5f1acf02906f6c08f3de176d7adb..b605d00d3609e305f1c23a2aa45416d677d4b097 100644 --- a/layers/encoder_1_attn_w_k.scale_values.f32.bin +++ b/layers/encoder_1_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:af573c1fcbaf6ed8e00ecee3be2df83045a17316c10bbc1204ec5d045243e648 +oid sha256:8e90310d7f602900c61d1ec0029aa69460d20598de178d6755dd8b6c42b109ba size 4 diff --git a/layers/encoder_1_attn_w_o.packed_weight.u8.bin b/layers/encoder_1_attn_w_o.packed_weight.u8.bin index 076ae94ff15b7e62842f4b00f9e6aa982835b585..b04d79240c774e6da71d3af2b012e6050d4d2a9d 100644 --- a/layers/encoder_1_attn_w_o.packed_weight.u8.bin +++ b/layers/encoder_1_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f19e5897cb1f6b93eafa7777649e0d337bc230a814b8ecbdbf81316e4e448309 +oid sha256:e1d4ba087cb7fd9337ad647b9ef35af6ef83ef1a9e2611f177e7e76cec268d67 size 102400 diff --git a/layers/encoder_1_attn_w_o.scale_values.f32.bin b/layers/encoder_1_attn_w_o.scale_values.f32.bin index c5222dd32e12e1c552149ea7d58c90a80d06e98f..a9c317936a7ae2dffdf4f62434397553bea772f7 100644 --- a/layers/encoder_1_attn_w_o.scale_values.f32.bin +++ b/layers/encoder_1_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b016b418d7fc1745d3617cbbc7b69aff439aeabd33920e142ddc659297ef3c0a +oid sha256:94401ac4905ab9a6a51cd297f505caa81434ed03ba406ef6a8cc3e1759b2dbcd size 4 diff --git a/layers/encoder_1_attn_w_q.packed_weight.u8.bin b/layers/encoder_1_attn_w_q.packed_weight.u8.bin index 72983331195a8f8defaa8df9cb8f59109a31562a..3ea902f4dabf0a83eee3730cbf16def49b2f83ca 100644 --- a/layers/encoder_1_attn_w_q.packed_weight.u8.bin +++ b/layers/encoder_1_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8940fa8a4deb50d60c9fce77c30bff8e9cca946bc31abf081c2375570a288b2d +oid sha256:abe92f5a662e92da5725883968212a2e90a77f05e8499dd0eb5c3134279535cb size 102400 diff --git a/layers/encoder_1_attn_w_q.scale_values.f32.bin b/layers/encoder_1_attn_w_q.scale_values.f32.bin index 6daf982aaadd20d3aec0c572400bac899dba89bc..49bb85e3b3606634a2c6700ae93891f9e0532836 100644 --- a/layers/encoder_1_attn_w_q.scale_values.f32.bin +++ b/layers/encoder_1_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:29b3b5b9328009be6b021713f0759c18c17a06ba90b3ef71a6e863ee0918be5a +oid sha256:f92420a0087a6ad79021a64f1300eeb7d53c4146df1e5f92c339fdd606d4808b size 4 diff --git a/layers/encoder_1_attn_w_v.packed_weight.u8.bin b/layers/encoder_1_attn_w_v.packed_weight.u8.bin index 61cafa1f20e2b0f2117924535dc23a3f1e5dc857..01936bbb65b84db4afec8ea43805531459cd63a9 100644 --- a/layers/encoder_1_attn_w_v.packed_weight.u8.bin +++ b/layers/encoder_1_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1a01f6835913c38e63770ae5fe0ab82479ffc2752577a6eb44d24af3e00d6587 +oid sha256:fe4fc47da4a97ad0fd49c5dcbb7175aec7a0d2f7fa4f9f82c2703ca88cd13b76 size 102400 diff --git a/layers/encoder_1_attn_w_v.scale_values.f32.bin b/layers/encoder_1_attn_w_v.scale_values.f32.bin index 13d52863528c4e04ac24ab500ced86cf1cdc17f0..41ea50bb3c825bae6a05b3f44f9f7f6f2a9706a6 100644 --- a/layers/encoder_1_attn_w_v.scale_values.f32.bin +++ b/layers/encoder_1_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:47b1d24599171b0027ee130ebf038f4b1694a326f7d6a783678eedcccadfbf3b +oid sha256:b2efaab082de4926716917ed6472d67ead22eaf2c71ebdcae672069a4acdf9fe size 4 diff --git a/layers/encoder_1_mlp_w_in.bias.f32.bin b/layers/encoder_1_mlp_w_in.bias.f32.bin index 092df7511fdad1c1530acfaee5db367b1e0de43d..f26d9732d3acdfc366b610a5e0da1a31654bcd26 100644 --- a/layers/encoder_1_mlp_w_in.bias.f32.bin +++ b/layers/encoder_1_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:76f3eb35f85ad10508ad5d77d1d368ef3aa6f9fd05e8855de5bb591aea755975 +oid sha256:025bae5bd7c6d3874c23d1348d4d32d7a5c399e719416f1b22112784599348f0 size 16384 diff --git a/layers/encoder_1_mlp_w_in.packed_weight.u8.bin b/layers/encoder_1_mlp_w_in.packed_weight.u8.bin index 2f07501b7a64cd6f6b668ee0e17d4264c5bb86ed..b96adf9c5b5efbf5874c691042f4fc8689ef5039 100644 --- a/layers/encoder_1_mlp_w_in.packed_weight.u8.bin +++ b/layers/encoder_1_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:34a577f6ad2057bb305520709eeabda752495cd4fb693589c61f70a6783eeef3 +oid sha256:97ff605bae210a9b872523f788aa25bf06ae8da80eb62537ac6ba898ab0cd4aa size 655360 diff --git a/layers/encoder_1_mlp_w_in.scale_values.f32.bin b/layers/encoder_1_mlp_w_in.scale_values.f32.bin index e1dbdfbbb0995da5506c440eee424814fba93f21..7872341c42242375f88cf68f62c1ca20961c3e98 100644 --- a/layers/encoder_1_mlp_w_in.scale_values.f32.bin +++ b/layers/encoder_1_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0aab2d4afd974f7590fd6bc26ba84554f25fdf581885f8c2933ce4cfebc8592e +oid sha256:b14e688ad3655e5d1c26fc671f68d4911632515459181f058a45f5cc218a7973 size 4 diff --git a/layers/encoder_1_mlp_w_out.bias.f32.bin b/layers/encoder_1_mlp_w_out.bias.f32.bin index 923cc39a9298afa7c7b7e8c8fd63fb668b807191..5db7d2719241d4114d8d5952b61e9b6037069824 100644 --- a/layers/encoder_1_mlp_w_out.bias.f32.bin +++ b/layers/encoder_1_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:144c6c1b2a8b8dcfad3773938ab747e78d26057affe44e238d073e9ecde4d0fc +oid sha256:44d5985a564ba0032aee0a81b081ba706266d8e085a12c7f44d688918c8f4811 size 2560 diff --git a/layers/encoder_1_mlp_w_out.packed_weight.u8.bin b/layers/encoder_1_mlp_w_out.packed_weight.u8.bin index 8d689a088f3b8bcf94d0c4a6564ab01e3b842ddd..dd0edfa94b369b394a9c753ea3ea370d12dd9c4c 100644 --- a/layers/encoder_1_mlp_w_out.packed_weight.u8.bin +++ b/layers/encoder_1_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1a5c8c3c81b509c6fdb649cc2e3ea49b1cc694ae6976fdfb721d49c474440692 +oid sha256:7742ee5975e591618aabc5105a207b0f78065d02ee41cc6b45ac88df12bb4c1c size 327680 diff --git a/layers/encoder_1_mlp_w_out.scale_values.f32.bin b/layers/encoder_1_mlp_w_out.scale_values.f32.bin index 143bda6e4d00208a49b5f4571438911730e357a0..4ea101333c51488f29697b1dc117b2b5fc6e176b 100644 --- a/layers/encoder_1_mlp_w_out.scale_values.f32.bin +++ b/layers/encoder_1_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:14782673a4a81e0073f5799d05e72677ba9b13ce33ebbea20066976706374f5b +oid sha256:d4519cac1203163e20411c81058fcc9e15b2715b873377d9867a23f75a878b8a size 4 diff --git a/layers/encoder_2_attn_w_k.packed_weight.u8.bin b/layers/encoder_2_attn_w_k.packed_weight.u8.bin index a2fca38570908a01f8957f7cca178b0138b07ac4..106b3a270000a0faaaa4590c06d703fd1eaf3713 100644 --- a/layers/encoder_2_attn_w_k.packed_weight.u8.bin +++ b/layers/encoder_2_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a8a9ec384334edc880f6185c64a8bff5589bbaad2837e7fdd01171273fffc8bb +oid sha256:32ed7fb622aff2cf751fbd3986344f581380fc2d004517e2b3b7ae111fd31bca size 102400 diff --git a/layers/encoder_2_attn_w_k.scale_values.f32.bin b/layers/encoder_2_attn_w_k.scale_values.f32.bin index 3733451f0646142db9034b8f2ad984a7164e17d3..57a0e0131721803e5756cdd97818510711560ae8 100644 --- a/layers/encoder_2_attn_w_k.scale_values.f32.bin +++ b/layers/encoder_2_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8dd1eb0a4bd4d76edcb4df2a26bf09820b0823dcc01658344ff578826bf3a0be +oid sha256:8607a763ae93991b49232ae2fd052fc67c7709ef43d9074d8bd91c940a2f4217 size 4 diff --git a/layers/encoder_2_attn_w_o.packed_weight.u8.bin b/layers/encoder_2_attn_w_o.packed_weight.u8.bin index 2d635f4722b5a89d509f8872f48b250ba64a80c5..38068583e6fe1a3a7cb2acf7bcfec3f331fdff67 100644 --- a/layers/encoder_2_attn_w_o.packed_weight.u8.bin +++ b/layers/encoder_2_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8fcf7d9111e69f47f88f1c1c02447b2c07d4edda7830a62241ce46b52d6bfd31 +oid sha256:4cd3154e5a261d3671f9255147f5c7c123b89e391fa8d95d0e0d8f0aee5b6824 size 102400 diff --git a/layers/encoder_2_attn_w_o.scale_values.f32.bin b/layers/encoder_2_attn_w_o.scale_values.f32.bin index 9623a954668cef97ae002530dfd88f37ef8d7da5..a0c421e751599cc645b9ae2bba873e00846a61c0 100644 --- a/layers/encoder_2_attn_w_o.scale_values.f32.bin +++ b/layers/encoder_2_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a48b17cd6544aead4b0d681a5bacb90b0fbb0dc0fbd5e9b43703af9d655fff28 +oid sha256:bd285179d72698f1f3ec0a18f279f4656df36d31c859f2b106ec8b01caa99dad size 4 diff --git a/layers/encoder_2_attn_w_q.packed_weight.u8.bin b/layers/encoder_2_attn_w_q.packed_weight.u8.bin index 028985bf547c5d9bae3ac7963018be2982ec4e9f..03d05c49bd7d34feb561a56a1b739891d070fcec 100644 --- a/layers/encoder_2_attn_w_q.packed_weight.u8.bin +++ b/layers/encoder_2_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:728cff4693aaa8b3412cda55a9c5eb3cd34fa3319fe0d32b47e769b67acf27cf +oid sha256:4046b1503f400adae06277ce337563059601462ea3ed824adc1143d2bbae8d25 size 102400 diff --git a/layers/encoder_2_attn_w_q.scale_values.f32.bin b/layers/encoder_2_attn_w_q.scale_values.f32.bin index 227e2d4a87562e14666178f0945b06eac2d694d4..62a113a5d7d3b0078f34722db50d5a3ae92f38bd 100644 --- a/layers/encoder_2_attn_w_q.scale_values.f32.bin +++ b/layers/encoder_2_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a676145c71d793b31b8e1c700433b6c5ee619abe5781ae6a7f3d3138ebfc6790 +oid sha256:b6a2a79210118706fe89b4ddb96a41eb06075852ab1c209cdcab1652caa3907c size 4 diff --git a/layers/encoder_2_attn_w_v.packed_weight.u8.bin b/layers/encoder_2_attn_w_v.packed_weight.u8.bin index 49b80a30f64f243d21a69d741f6cf5ccc0068ec9..f52d34fe92db33b36e95f94923b12428033f7154 100644 --- a/layers/encoder_2_attn_w_v.packed_weight.u8.bin +++ b/layers/encoder_2_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:556bfae148c0efc3fe914cf102c008342ebca522e62edfd5b2664ac32aa70c06 +oid sha256:64940ce687d9f5cac4bc5c0ebeedaecb3e8551bfaf05135a27c04b4158b9b9f2 size 102400 diff --git a/layers/encoder_2_attn_w_v.scale_values.f32.bin b/layers/encoder_2_attn_w_v.scale_values.f32.bin index 366dffbc929f5316b3c25bb51d3661f49498a923..ac6c7558323da05185f80c170e42f0442efbd692 100644 --- a/layers/encoder_2_attn_w_v.scale_values.f32.bin +++ b/layers/encoder_2_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5203a15a236be8e0d05745452f1eba88b7ee04fc550a31b0839d4cf3bd15a90b +oid sha256:17eb0fc4ae802ce844e776193fc48d96664c74682bd8ed65f0659401c25ccee2 size 4 diff --git a/layers/encoder_2_mlp_w_in.bias.f32.bin b/layers/encoder_2_mlp_w_in.bias.f32.bin index 292d0e4bfe969dbee27f3865de53f722867ef6db..3054fd42dd7aa5be5fd0480dbb4b1a8f60518951 100644 --- a/layers/encoder_2_mlp_w_in.bias.f32.bin +++ b/layers/encoder_2_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:55f1ac5b29cccff2b7c2e26766f16f4eb81173f165d889b6c484a41b7adf6020 +oid sha256:756a058396dc773b98e7fb45c72299bb1402b3a7f4ff319a435fdae1a5a14a0d size 16384 diff --git a/layers/encoder_2_mlp_w_in.packed_weight.u8.bin b/layers/encoder_2_mlp_w_in.packed_weight.u8.bin index 9bcec8300f6cca55827ebbb8bfee50b09135f31c..9500d132ade6955a2a2e5f95c4f8510968a6094c 100644 --- a/layers/encoder_2_mlp_w_in.packed_weight.u8.bin +++ b/layers/encoder_2_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d644ee10bc3b7f73bfa320283405780d256ef4809748bde34fdeb899369685e9 +oid sha256:5c27668c24ade7f4989551e3a23c729512fa3399126e8131a9a7c3b7beba93f2 size 655360 diff --git a/layers/encoder_2_mlp_w_in.scale_values.f32.bin b/layers/encoder_2_mlp_w_in.scale_values.f32.bin index 763eebd69694e56e54fa847783aef0bba1096180..6f92fef71e02546b77917aadc78aba2f48a49c13 100644 --- a/layers/encoder_2_mlp_w_in.scale_values.f32.bin +++ b/layers/encoder_2_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:77941e8d1c33bf8e9f73dfb3902ddaba54ae2b4c9d33a14b40affed7a230d658 +oid sha256:ea11ebc8e04d3fa09dad49efbb2465b461308a8353d1fddf1008c25cf47b1f49 size 4 diff --git a/layers/encoder_2_mlp_w_out.bias.f32.bin b/layers/encoder_2_mlp_w_out.bias.f32.bin index 553783d9876c960f1a1dfd7de06cac4f3378eb16..14ac064beb110180f59f52f5a214b82f72a0ceb2 100644 --- a/layers/encoder_2_mlp_w_out.bias.f32.bin +++ b/layers/encoder_2_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bf765646a81720449bcd584215038473a9cb7ef7125e4cfba5cac598127e67fe +oid sha256:1a85a10eac9d0a55eec02edf2e3b706e87066e836808c100715b883e65689cc5 size 2560 diff --git a/layers/encoder_2_mlp_w_out.packed_weight.u8.bin b/layers/encoder_2_mlp_w_out.packed_weight.u8.bin index d0ac09b0b6d97ab1d7d44060b09e482460f40b88..370f4a15fd7cd6ffa63037c4e215d072e9ec8ea0 100644 --- a/layers/encoder_2_mlp_w_out.packed_weight.u8.bin +++ b/layers/encoder_2_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5ff72ecd699899e9a4ea52137bd662ca80a3272f8e51f2a98c97a6be25d4235c +oid sha256:dd26321691449af82d643801b9262dff7365260cc32b665c25dee5889cd4df69 size 327680 diff --git a/layers/encoder_2_mlp_w_out.scale_values.f32.bin b/layers/encoder_2_mlp_w_out.scale_values.f32.bin index 0d9f2a94835098ffd00d1ad31951ec2321fbcbb5..5142ca31d8f0bd31a7defcfbd69d5fbf269cd7f7 100644 --- a/layers/encoder_2_mlp_w_out.scale_values.f32.bin +++ b/layers/encoder_2_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:97cbd68d328e18fbfda32667ee470c3aa4eafe78bd0b78b995f2bfe564bfcca3 +oid sha256:ca2d4e4c3da8b0e7a0ab688a4883b2040bebf1e22d545576a795c847e5ea2b28 size 4 diff --git a/layers/encoder_3_attn_w_k.packed_weight.u8.bin b/layers/encoder_3_attn_w_k.packed_weight.u8.bin index 09f15c9d97436b705a8ad8ac3e9b29494b3350dd..6c34082e9155ab1deb5db7313ff629f5e453e078 100644 --- a/layers/encoder_3_attn_w_k.packed_weight.u8.bin +++ b/layers/encoder_3_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:615881e833f29f120b78dde432d5328a8447ae9d1c08b242f523be3d019382d2 +oid sha256:5a9a3e87cb0ccf9381821b2c13cd09a88996d04fcd808ae3b6313622c9986444 size 102400 diff --git a/layers/encoder_3_attn_w_k.scale_values.f32.bin b/layers/encoder_3_attn_w_k.scale_values.f32.bin index a8438ccbed1bb70bb5664229dbadaaf2c98381cf..8a8df4be3be301eafe1381a75835ee842e1cf042 100644 --- a/layers/encoder_3_attn_w_k.scale_values.f32.bin +++ b/layers/encoder_3_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b45f07b7955b4ae7104c7df0c5d3fa813bf7125a8768ad0741d10a7acd3218c8 +oid sha256:c94e97d5feb0a8acb690700c648981cd8ddadef54399a0a263cb112141cea08d size 4 diff --git a/layers/encoder_3_attn_w_o.packed_weight.u8.bin b/layers/encoder_3_attn_w_o.packed_weight.u8.bin index e08553db5bd4e57e0a27dd3d02c607abbaa58b07..f0c35cdd2bf2b90cbd53dca3c281ae5be4e86b1b 100644 --- a/layers/encoder_3_attn_w_o.packed_weight.u8.bin +++ b/layers/encoder_3_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:670e7caebcbd937e313590599bad83fad1f999d2e4256a21dee1119293d069db +oid sha256:6291c1abeaaea0b97649438a296d76ceb106575b71884102d3542b00ef05e8c6 size 102400 diff --git a/layers/encoder_3_attn_w_o.scale_values.f32.bin b/layers/encoder_3_attn_w_o.scale_values.f32.bin index a31c7ea44e9751f088135618449201b36326f7af..23db519bde52fa46c457011b541cb878898665e8 100644 --- a/layers/encoder_3_attn_w_o.scale_values.f32.bin +++ b/layers/encoder_3_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8b688d988ba3c12fcbe0b2cd81b3140a2a7403d7c986f99a0398856152282ae1 +oid sha256:bd39061fcce791e35176cff9de492ef93343a6c39e27730e241ddedfb549a768 size 4 diff --git a/layers/encoder_3_attn_w_q.packed_weight.u8.bin b/layers/encoder_3_attn_w_q.packed_weight.u8.bin index 1efa0ca3ce3513f1ddd295cac1b195539f7d6f9d..146eae7ebac54fabc69dc5f3e51d63d970eb95c7 100644 --- a/layers/encoder_3_attn_w_q.packed_weight.u8.bin +++ b/layers/encoder_3_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:93a3d233014e43a89110fdbcd913ebeccbee67222bc170bdc097e5d1a14f790b +oid sha256:baa0d119c263884f0022dff7e7e4020996ea2c91c9912f568f2ede5559432027 size 102400 diff --git a/layers/encoder_3_attn_w_q.scale_values.f32.bin b/layers/encoder_3_attn_w_q.scale_values.f32.bin index fda6041c0bc8edbd630b9fa12fb540725a4efd54..97adbdcf542f508c8ec04808da791726834f9055 100644 --- a/layers/encoder_3_attn_w_q.scale_values.f32.bin +++ b/layers/encoder_3_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9228202b5e7125cf5b8bdc0e53498cb8165e7130b718a59da5d6924ad99173c4 +oid sha256:adad57af78e9167da8b4e5855e46083456100ffd1ed101e0f84074e9496c7d27 size 4 diff --git a/layers/encoder_3_attn_w_v.packed_weight.u8.bin b/layers/encoder_3_attn_w_v.packed_weight.u8.bin index f7fee66b7e87f93e508fc7cecdfba54304ee376b..89249e1ebb56c4eaaa06506998507590c473691a 100644 --- a/layers/encoder_3_attn_w_v.packed_weight.u8.bin +++ b/layers/encoder_3_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7c3eaad05215d7ee91070277ad7518baa3fd19b900c5b2c6ea621f51f8d7e577 +oid sha256:2bd7d1359728efce205ef25d36c8d47b7ded204343a3074ca03ad64bb485ae42 size 102400 diff --git a/layers/encoder_3_attn_w_v.scale_values.f32.bin b/layers/encoder_3_attn_w_v.scale_values.f32.bin index 00f0f2469ac7a32211fe1d9cd37a24df7bc25f53..2a0e6d3bd5e2711d87bbc687e872d8a14f01d5f0 100644 --- a/layers/encoder_3_attn_w_v.scale_values.f32.bin +++ b/layers/encoder_3_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:350d62ab7cd78d7c07e33dda62d04dbbb68586a00b5fc3d7cdfca3d59117371f +oid sha256:f7b3d178706d789bfbc5ed3419c8abdfce30d733cd967d5a7ce3f92560ecb7aa size 4 diff --git a/layers/encoder_3_mlp_w_in.bias.f32.bin b/layers/encoder_3_mlp_w_in.bias.f32.bin index fb994b71b235a2e75d75ee77ce59257c2af5b7b6..091b4f43a2dd2592cbf03a05b7f5856080a4ec53 100644 --- a/layers/encoder_3_mlp_w_in.bias.f32.bin +++ b/layers/encoder_3_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9b94e5c80466ca951ccc2ce5e34b000be946db165d23abc5eec20731ce507504 +oid sha256:fd93590315d0550dadb82709589d499011558085fe7f42aa87a41a87c2742e9f size 16384 diff --git a/layers/encoder_3_mlp_w_in.packed_weight.u8.bin b/layers/encoder_3_mlp_w_in.packed_weight.u8.bin index 840980ca914cac6b40b3dc2980ca2a698d022090..af94632008d6de220aaef5f6a1bbe835009ef1d7 100644 --- a/layers/encoder_3_mlp_w_in.packed_weight.u8.bin +++ b/layers/encoder_3_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:db06ff658696f3c55e103c70b7e2c0494f68492ec148363b0c06f2c2e64da426 +oid sha256:8b117e51f471d478c8c5da5e498e0635c1ce74b32e75e4d923b6485ea87353da size 655360 diff --git a/layers/encoder_3_mlp_w_in.scale_values.f32.bin b/layers/encoder_3_mlp_w_in.scale_values.f32.bin index 4108acd54e19982f607c39354c844c321e49a322..be020300e1942af581af12a50b581bceb9568add 100644 --- a/layers/encoder_3_mlp_w_in.scale_values.f32.bin +++ b/layers/encoder_3_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d08e720749c4112b88d0fe34674fb6851bd5ec321c3e8ac40d4b157cc60c99c1 +oid sha256:49e75f99e2d5f25276cbb411044e6acc42c8b520b449a0e88d0f36927fdb3b9b size 4 diff --git a/layers/encoder_3_mlp_w_out.bias.f32.bin b/layers/encoder_3_mlp_w_out.bias.f32.bin index 7b33ab584246999c28202307501c4e4b37a68d60..15296d365e08149f63b4e1c52b9b26b81c3beb79 100644 --- a/layers/encoder_3_mlp_w_out.bias.f32.bin +++ b/layers/encoder_3_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:44865713fc16e41e8061e1be0678e07e8f85157d5c540b51c9a79b52090b1cbc +oid sha256:0f4777ca7ed1def47f66c0c13245e859f585b3401bff9b2fc0692869bcf6c3b8 size 2560 diff --git a/layers/encoder_3_mlp_w_out.packed_weight.u8.bin b/layers/encoder_3_mlp_w_out.packed_weight.u8.bin index 0f0941202d3d935249b07943cde106b0b327b314..ccda21a748c8a50b99ad56bfbf253c7d2bc0cd68 100644 --- a/layers/encoder_3_mlp_w_out.packed_weight.u8.bin +++ b/layers/encoder_3_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e5afd5b12dbc0a921c3d5be92f444c00e9fe35514919ead5113bfbefe70eb423 +oid sha256:3ddab3f329beb5d19a28e69aef00ac69b708a6696f78e84254033d362b4cff02 size 327680 diff --git a/layers/encoder_3_mlp_w_out.scale_values.f32.bin b/layers/encoder_3_mlp_w_out.scale_values.f32.bin index 34c1ee20efc526a1a74d097407c2e8b8350433e7..4a38596d5943df0453ebbc2f9b781eb520713c3c 100644 --- a/layers/encoder_3_mlp_w_out.scale_values.f32.bin +++ b/layers/encoder_3_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9c245c034ec27db041b7a2cc308dab23a6ed2db32a09af0fb587d2826dd8e5db +oid sha256:fc14d3937542e30e559658d7b9bb2377fd78c81771e3f3e7cc20c690648ea7b4 size 4 diff --git a/layers/encoder_4_attn_w_k.packed_weight.u8.bin b/layers/encoder_4_attn_w_k.packed_weight.u8.bin index b0509fe1f72e83911ba25da294ddc34759632f88..d2f093e15c6e353dc8b83af106c28a0c2328d39f 100644 --- a/layers/encoder_4_attn_w_k.packed_weight.u8.bin +++ b/layers/encoder_4_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2b50baad9a382d17d6bba2109fe7c7afd6c658bef1533c4fe2d534ad427f7c43 +oid sha256:10a703b02e24bbfaf3495bc1425befd4a89e9c6f09744e2a1c0706355cbcbeec size 102400 diff --git a/layers/encoder_4_attn_w_k.scale_values.f32.bin b/layers/encoder_4_attn_w_k.scale_values.f32.bin index f0a874a5bca9a0be0c01b07a70a900f43f5edea1..a97e498f52d4a7da74bf2b0fca9354aa4499e506 100644 --- a/layers/encoder_4_attn_w_k.scale_values.f32.bin +++ b/layers/encoder_4_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9025f9bd080125d7499f6b4a768e6226046f736c06332055fc868f48b89f3a46 +oid sha256:531f130bb155c8228c57f8775050b5bc55fe608c07b428bc621c7a2397638773 size 4 diff --git a/layers/encoder_4_attn_w_o.packed_weight.u8.bin b/layers/encoder_4_attn_w_o.packed_weight.u8.bin index 0ae984824c4612b5390c970fe90a6872b5a69454..a5b339ca826767360de5a5f1791b61a844413b2d 100644 --- a/layers/encoder_4_attn_w_o.packed_weight.u8.bin +++ b/layers/encoder_4_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:70bd484dcdf0064d9638b964c017b1da8bc62a86534a7aad8f4637f467b17ec6 +oid sha256:a94d196e77a98f4ed95df7a9102b2991e536dc5f3071302b1a497fce6d5de673 size 102400 diff --git a/layers/encoder_4_attn_w_o.scale_values.f32.bin b/layers/encoder_4_attn_w_o.scale_values.f32.bin index 8e1433407f79ae34a287f6555d5d1e149ff7d9b9..e9eeaababd7734f88d760050e13a6636c7a2d271 100644 --- a/layers/encoder_4_attn_w_o.scale_values.f32.bin +++ b/layers/encoder_4_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0edd3e4c033ed0928aae622f4c279639a88e324bd180d1b7f2a86a0ded3a7f2e +oid sha256:65dafd5676fdc4978472be0e5ffecd6e5ec5549fb6d5664b79e8d02e4cd0878d size 4 diff --git a/layers/encoder_4_attn_w_q.packed_weight.u8.bin b/layers/encoder_4_attn_w_q.packed_weight.u8.bin index 732ae7880593b450c381e4cd4f2fbe7d79e56b98..955fcac36dc7a86e2c89681ad42885cbd1d9b5a9 100644 --- a/layers/encoder_4_attn_w_q.packed_weight.u8.bin +++ b/layers/encoder_4_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a745262c6dfa925e52caff29d28d589cc7f9a0de2fc31b66b1193d884a086c7c +oid sha256:728a805cfca6f97949f88c31871ef1be00603a46d9bf20fbbeaf9a63ecd92167 size 102400 diff --git a/layers/encoder_4_attn_w_q.scale_values.f32.bin b/layers/encoder_4_attn_w_q.scale_values.f32.bin index fe35b8b19f220aeb04288600b4f77a25ec0d824d..e9a3646a8d1b5d8f2d87659a5c9ec939943a804f 100644 --- a/layers/encoder_4_attn_w_q.scale_values.f32.bin +++ b/layers/encoder_4_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:018d0aa83591d3aedb9e18e578bef80d29a0c8b145d07831baf7736115ad6102 +oid sha256:3b9e454e60a6a13e5102da4c03d527762bcf2b9bf12d486e799d61c3658c8dcd size 4 diff --git a/layers/encoder_4_attn_w_v.packed_weight.u8.bin b/layers/encoder_4_attn_w_v.packed_weight.u8.bin index da5a27680fd13a6b58027900d8dbd7192fa453fa..5e5368031d058d5a3fcb4cf3ea1b7790598bb355 100644 --- a/layers/encoder_4_attn_w_v.packed_weight.u8.bin +++ b/layers/encoder_4_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:90309d347ca7a149c7aec39fe41ca1281b0981220a4d9d7e81ff92a6838ce3bc +oid sha256:e5d4f475baae4060d3cc5a3a82f3a52ad92447d23710c3bb3577d99a02ce890d size 102400 diff --git a/layers/encoder_4_attn_w_v.scale_values.f32.bin b/layers/encoder_4_attn_w_v.scale_values.f32.bin index 126bf4b58c06e308f8ef517724c1f455e0b35a4b..c827aba161ebb721e9f4aaca18371927139c793a 100644 --- a/layers/encoder_4_attn_w_v.scale_values.f32.bin +++ b/layers/encoder_4_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:62dcd2181659d271311c3f48d2d30ffa824fc90775ed78243af216b5e5dfe17f +oid sha256:8dc5c14c4a1ce0a7eda48fedb3496c154e2fd035b372b8c1fbb67ebfcbc3ad95 size 4 diff --git a/layers/encoder_4_mlp_w_in.bias.f32.bin b/layers/encoder_4_mlp_w_in.bias.f32.bin index b0a2b027ba678c6f4cb74b15799fbc8a3a51b1a5..817eab5b9e864a0732342b106f564fba6bb651e7 100644 --- a/layers/encoder_4_mlp_w_in.bias.f32.bin +++ b/layers/encoder_4_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9af5a6606f55fc82f725d4cc9ce177d34a22ea92bade6df259d63436380fedad +oid sha256:1895bd3a783cadcce33598fd40adbec1468989bfb911673a0fb315883e21647e size 16384 diff --git a/layers/encoder_4_mlp_w_in.packed_weight.u8.bin b/layers/encoder_4_mlp_w_in.packed_weight.u8.bin index 98e576518b174a1a65e56e7b6a490edbd179023b..cf712baca10739bafafaa4a76c6b14e53827f5b5 100644 --- a/layers/encoder_4_mlp_w_in.packed_weight.u8.bin +++ b/layers/encoder_4_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:330c9c65ca8995c4ee29fdd90955945bce2aaab71c92537223aea7aaeb0d6569 +oid sha256:9d3742046e3c417116c43c76a09c313d31979170bd39d42a5dde6f0a7e9ad08c size 655360 diff --git a/layers/encoder_4_mlp_w_in.scale_values.f32.bin b/layers/encoder_4_mlp_w_in.scale_values.f32.bin index 1136acb3d07ab12c4752036a9966071f089dfb73..d32625fc5f2f3f0a530a7ccfbe38eab8b31c9c9a 100644 --- a/layers/encoder_4_mlp_w_in.scale_values.f32.bin +++ b/layers/encoder_4_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:03dd37152ed6956f01f128e4d651326b253d0a7e3b9a35a65070922e5e1a21fb +oid sha256:88b516eb6de001eed4819d59a8e8af51f48eabf45e0e08400cf7351198e404b8 size 4 diff --git a/layers/encoder_4_mlp_w_out.bias.f32.bin b/layers/encoder_4_mlp_w_out.bias.f32.bin index afcc542ec90341f01d0ad55d3b908c23495fa9c7..dbca2910dc95108914a5b0077c0b13030b088ce6 100644 --- a/layers/encoder_4_mlp_w_out.bias.f32.bin +++ b/layers/encoder_4_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c920b2e3ea660534d14bea1df49772cc1b36d4faa2316234ae134ef3e588e302 +oid sha256:a37f53e3778a72816f2020f1e2e74ce0387bf8f7f1894bcb5e21337b17a975a5 size 2560 diff --git a/layers/encoder_4_mlp_w_out.packed_weight.u8.bin b/layers/encoder_4_mlp_w_out.packed_weight.u8.bin index b58da887b9e17fcb1323eb059114c1a56ef3b86a..c2a9c68c43d6f25321cdb1fb34e5ba70354d0391 100644 --- a/layers/encoder_4_mlp_w_out.packed_weight.u8.bin +++ b/layers/encoder_4_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:64b20c3eac7e24b676d7808230d57df66f48ddfe2627d40f5ea7ca8818d0535b +oid sha256:cb2919b644968c18f3d8d07f4a7c2dff37300f3a19ca9252d608515e27356843 size 327680 diff --git a/layers/encoder_4_mlp_w_out.scale_values.f32.bin b/layers/encoder_4_mlp_w_out.scale_values.f32.bin index 741fa7f8f0b9b44276d17d9b355ed57fb3d165a0..f7f323a381aa3ac52b0d7b3d205a6a7f15366c10 100644 --- a/layers/encoder_4_mlp_w_out.scale_values.f32.bin +++ b/layers/encoder_4_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7c930bcb7eb3ae14e26747f63a85e3bc9b5d51910ffefdcf0aed5f03081187c5 +oid sha256:acf932162b73f02f4dac3a61e9fbb063804e282e457542dcb81087ac0288e496 size 4 diff --git a/layers/encoder_5_attn_w_k.packed_weight.u8.bin b/layers/encoder_5_attn_w_k.packed_weight.u8.bin index 172ea765bf6dfe57125231ee82bfe18ad011a422..9e971bef6e84cdb081824c50b26dfc985588739b 100644 --- a/layers/encoder_5_attn_w_k.packed_weight.u8.bin +++ b/layers/encoder_5_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bdb31459fec6790046f058ff5417102ba655f3a943cccf66396236fa663f14c0 +oid sha256:6050252cdefae7097fef44b72a46832ef84555bf3129e31fb1706699b54fb993 size 102400 diff --git a/layers/encoder_5_attn_w_k.scale_values.f32.bin b/layers/encoder_5_attn_w_k.scale_values.f32.bin index 7e3e136fede825ab5509cd566832817564f3b4dc..c6d644ed0cf339dbbfdd8a8172434fa07c87fcc6 100644 --- a/layers/encoder_5_attn_w_k.scale_values.f32.bin +++ b/layers/encoder_5_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:933fac989d60e00f6148fdd80406d4d8b0ef95e2bb1c5bf0bb7d6eeabbf50325 +oid sha256:821f63202f456185ca334f8df5549720d54d696d62ed9ae84dfe0ba200913545 size 4 diff --git a/layers/encoder_5_attn_w_o.packed_weight.u8.bin b/layers/encoder_5_attn_w_o.packed_weight.u8.bin index 8ea0e8cd3b13b1a6f9818feda19421903a713499..a1c66e5c74c1848af40fb2a84780d3fe9563cc9f 100644 --- a/layers/encoder_5_attn_w_o.packed_weight.u8.bin +++ b/layers/encoder_5_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:03fac26859771cd01d5af4fadacd835790eb7bab941be228b4bbfe723b31b03d +oid sha256:0c9021bc8c3337e9e07cdeac52581df7895492820dd4c39aa2a8fa0a170e21a0 size 102400 diff --git a/layers/encoder_5_attn_w_o.scale_values.f32.bin b/layers/encoder_5_attn_w_o.scale_values.f32.bin index 7e394c8c8e1993ec722b005f569151ebc6154e0c..68e2d3326ac37d4723994c0f19cdcdfeb4485358 100644 --- a/layers/encoder_5_attn_w_o.scale_values.f32.bin +++ b/layers/encoder_5_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7ec8adf1d1d949c1dc66df40b209d212892a4c0879e1c25a3683c676db9321e8 +oid sha256:79dcab88153ccd85a92bf06a820212da7514276d13c9d246b383731a60ad4278 size 4 diff --git a/layers/encoder_5_attn_w_q.packed_weight.u8.bin b/layers/encoder_5_attn_w_q.packed_weight.u8.bin index 46df59a061067321d8d296823a8e7bc310cef832..9dd19d1e9c4174eb503bdb0a49ff96d4a3788806 100644 --- a/layers/encoder_5_attn_w_q.packed_weight.u8.bin +++ b/layers/encoder_5_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:17992f4e033ba3cadc4024b246db460439d524500fbaa3e80fecc32c072015e2 +oid sha256:7dd4d44c1ffabf832cb1a2de16b9fe41eda6fdab014995e14d8e985656429fef size 102400 diff --git a/layers/encoder_5_attn_w_q.scale_values.f32.bin b/layers/encoder_5_attn_w_q.scale_values.f32.bin index 575571c23f1ac5bd9375407d94c32bb5328c9005..a1aba102d49f63b0d05cb0c644bf47da788f2dd7 100644 --- a/layers/encoder_5_attn_w_q.scale_values.f32.bin +++ b/layers/encoder_5_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dbce1773e2798fbe649bd5b896bdd54ef0e360df6c126fdf0d1c28733486cf99 +oid sha256:7624e04915864961ee93653aa33a552ae72de0f333aac4bb5070ee12d3164a02 size 4 diff --git a/layers/encoder_5_attn_w_v.packed_weight.u8.bin b/layers/encoder_5_attn_w_v.packed_weight.u8.bin index 0e0667958c963e891c5035963dc8d71888441b34..fb5c4e96283d2cc70e57df639e252be4bb9b04b4 100644 --- a/layers/encoder_5_attn_w_v.packed_weight.u8.bin +++ b/layers/encoder_5_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ef7c5acaddfb0083d3330e6b8f54dad6c037482910066c47374e42e8e756a303 +oid sha256:e53e30cf99dfb375124f09e4aafd8f94d002f350320d64ed184535c6494d67f7 size 102400 diff --git a/layers/encoder_5_attn_w_v.scale_values.f32.bin b/layers/encoder_5_attn_w_v.scale_values.f32.bin index 389bb37adc27357433a571cf37ebe50995b0e15b..2a44d74577bec42cff67d3c5674b384936944eab 100644 --- a/layers/encoder_5_attn_w_v.scale_values.f32.bin +++ b/layers/encoder_5_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:51b137bb07bab1f7ae40e9693fa260009f5709a974777b2b4bd4bd8daf5f2e9f +oid sha256:f76061e291a207776605c5ad3c7d62fe4d33568ecc9033af6c0b627e411b3c11 size 4 diff --git a/layers/encoder_5_mlp_w_in.bias.f32.bin b/layers/encoder_5_mlp_w_in.bias.f32.bin index ec4838c5c03c89574ba9d227feb593a583cedba7..31b38c4cf5cb94634720199810e01f2a45fc6849 100644 --- a/layers/encoder_5_mlp_w_in.bias.f32.bin +++ b/layers/encoder_5_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b0602c6e9911ecf12d950fdbe9578826bece7652a4ffe3a4c4d09336867de439 +oid sha256:84867af91e82c506906ddb71b0a230680dd925d90773bb297b7fd5b0b7713542 size 16384 diff --git a/layers/encoder_5_mlp_w_in.packed_weight.u8.bin b/layers/encoder_5_mlp_w_in.packed_weight.u8.bin index 09d6fc45f417b666ab9f6d35e69f2faab06e4618..b8c7d948dfdb1eca98787185b824be07d2910d47 100644 --- a/layers/encoder_5_mlp_w_in.packed_weight.u8.bin +++ b/layers/encoder_5_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:701ef35d26908f55fbc1c25559a106e3b9996c6017650de149acba30a6b452b1 +oid sha256:93f7b29f255947dd72d7a5ad15b60f2c68c4b3e148b922f4794bcf96bf7aef87 size 655360 diff --git a/layers/encoder_5_mlp_w_in.scale_values.f32.bin b/layers/encoder_5_mlp_w_in.scale_values.f32.bin index a3bc6c6ba83972ad17327498c8aebdbcf55a4da7..11fc70f486ba838449022e432eb6512876ed62c8 100644 --- a/layers/encoder_5_mlp_w_in.scale_values.f32.bin +++ b/layers/encoder_5_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:75b4b4d89d08840c2f4176f269224be79faecfaced1b6be41d285d0d1df7dcff +oid sha256:07471f0e22ba2cd8c2c7b735c203d91c874fc834b4209788a236fc9529247943 size 4 diff --git a/layers/encoder_5_mlp_w_out.bias.f32.bin b/layers/encoder_5_mlp_w_out.bias.f32.bin index 809638f08eaa29b090ce41b2da72a25c3aa3d477..15e444acd5d5c5778f3a1400a024662f3cd1ebde 100644 --- a/layers/encoder_5_mlp_w_out.bias.f32.bin +++ b/layers/encoder_5_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6131b28da40f02a17f49f84ea2dc74a0ce5b702e2f0d9eb4392ea28bb85c4e76 +oid sha256:d1ccf0c6e752d23d27842dde01b4bc430190dab45e3bfa8dd8417dfe4c13cb15 size 2560 diff --git a/layers/encoder_5_mlp_w_out.packed_weight.u8.bin b/layers/encoder_5_mlp_w_out.packed_weight.u8.bin index 1226b8976d792b5bbafbc2c1e11fc63ecf207d19..19ed6f7000c2a203819a43b518bbf4ac91c3da6b 100644 --- a/layers/encoder_5_mlp_w_out.packed_weight.u8.bin +++ b/layers/encoder_5_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:83b2c60db531b3fa20066c2c4e1950b6900a7a27fb932eab96df17efd383bcab +oid sha256:5c8cf16a336ac7618477e7a52f8eb8b12d5bbd7004f961745f08abfb3f36039d size 327680 diff --git a/layers/encoder_5_mlp_w_out.scale_values.f32.bin b/layers/encoder_5_mlp_w_out.scale_values.f32.bin index c89c12c9603968e6029fc59bfbcac0564dd4d960..19b9b7a341a8f59419a3b10d69e9672da97e2386 100644 --- a/layers/encoder_5_mlp_w_out.scale_values.f32.bin +++ b/layers/encoder_5_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d06678dcf842cc83e25aa12695675d8abd59d0dd3002a6a70d8b6e78b53af1c8 +oid sha256:4587070b10b62cb7687541b3e9946824e292b8f024c39b9d388202d61a5244b4 size 4 diff --git a/layers/lm_head.packed_weight.u8.bin b/layers/lm_head.packed_weight.u8.bin index 348c54e044f61a3d6c58db2698ff8818a5c7ecf5..bfd326a4839e273efae95f0c1042a1ddaade97ee 100644 --- a/layers/lm_head.packed_weight.u8.bin +++ b/layers/lm_head.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5f9cd1687384a4f22ee9b78faa44a3b66113095161374ebc91d6e6f9b60a6ea4 +oid sha256:d077cc31fb0f453749ee885c7dab678178e198916cf13735c2e8c621c200c123 size 1313280 diff --git a/layers/lm_head.scale_values.f32.bin b/layers/lm_head.scale_values.f32.bin index dd134bee714c16d6554a4c106bcaeb5806f86d32..823e70a5f09dfae7c1758a9dccf6ac3d89b41062 100644 --- a/layers/lm_head.scale_values.f32.bin +++ b/layers/lm_head.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1aea5df41f70ea50217f47189f39b5750d114865679ec371f3b68804875da176 +oid sha256:4a6cc0d1c16f482a50974679ef9b7ef620ed03cdf8354fde8a53acada716c068 size 4 diff --git a/manifest.json b/manifest.json index 0a29b2ce6533116e882e53ad6a799de59e160df4..f661ff039dd3b0267fa7a5087c5159cbd021d1aa 100644 --- a/manifest.json +++ b/manifest.json @@ -7,17 +7,17 @@ "structured_decision": true }, "model_family": "agentkernel_lite_encdec_v1", - "parameter_count": 110885888, - "source_bundle_manifest_path": "/data/agentkernel/artifacts/agentkernel_lite_encdec/chatfirst_retrieval_special_compact_100m_from16000_train_17000/agentkernel_lite_encdec_manifest.json", - "source_model_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/chatfirst_retrieval_special_compact_100m_from16000_train_17000/model", - "source_tokenizer_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/chatfirst_retrieval_special_compact_100m_from16000_train_17000/tokenizer" + "parameter_count": 113507328, + "source_bundle_manifest_path": "/data/agentkernel/artifacts/agentkernel_lite_encdec/decoder_repair_respond_clean_from_freezeemb_retrieval2000_train_01500/agentkernel_lite_encdec_manifest.json", + "source_model_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/decoder_repair_respond_clean_from_freezeemb_retrieval2000_train_01500/model", + "source_tokenizer_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/decoder_repair_respond_clean_from_freezeemb_retrieval2000_train_01500/tokenizer" }, "dense_tensors": { "dec_embed.weight": { "bytes": 21009920, "dtype": "float32", "path": "dense/dec_embed_weight.f32.bin", - "sha256": "4f4e6de1db97417c8e97c5e715dd064b5c33c9e94702ac758166c94c5cef61da", + "sha256": "78c2a80005b8926af3752edc2ab4c56399688951a282a6b85bf9edbf917fe6df", "shape": [ 8207, 640 @@ -27,7 +27,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/dec_norm_bias.f32.bin", - "sha256": "5a504281bfbf8814d71a0347d2f1b29da2384360eaa32e344ff7056e112b4001", + "sha256": "a52ba99331e084971ab8824584f8d5e7b308f7f6d5856c6732f8ca9e93e28cf6", "shape": [ 640 ] @@ -36,7 +36,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/dec_norm_weight.f32.bin", - "sha256": "39fa6364f4ec83f1fee8ad937aee196331d07d86c987e3c4aaea1d78001cb562", + "sha256": "88a7e373f37f1a051e48de5aab9429ae16992571a5ee4536db1babd73dfe3e69", "shape": [ 640 ] @@ -45,7 +45,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_0_cross_block_n1_weight.f32.bin", - "sha256": "eb1544f5768be6328f6561e7149399a50d6f25a523d6c9b18eb44e92546fc5c1", + "sha256": "e9c937f04235c2be29c729ccb28cdfb4e3bca8356921b61a022e0607831129be", "shape": [ 640 ] @@ -54,7 +54,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_0_cross_block_n2_weight.f32.bin", - "sha256": "076f5ecc86169fc36943250486b0081df382202af90259ffee7072fd74123fcf", + "sha256": "78579439b641dd9fdd660faa7775d54b5e3b73274a8ffdbd7c627711063d1d9b", "shape": [ 640 ] @@ -63,7 +63,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_0_self_attn_block_n1_weight.f32.bin", - "sha256": "fdcf9066e761f2f195c430f007594e21aa66f1234c0b85328040f9e7e554dad3", + "sha256": "c2e362ce5f59f6f6086843ed701ad3d3dfaec44f641da7a2be9fd16e0be21c62", "shape": [ 640 ] @@ -72,7 +72,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_0_self_attn_block_n2_weight.f32.bin", - "sha256": "6e74eda63198e8b627cb92dbf9ccacca9f96deac1a7d2c476d4b6cdbb9dd35cc", + "sha256": "ec08bf70a433d42cd2eb3a285a8612deead826ed83e7e4f35a39cd7ce353f041", "shape": [ 640 ] @@ -81,7 +81,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_1_cross_block_n1_weight.f32.bin", - "sha256": "e5ca042ac675538a09d1f203f5612ddb70ce142851f2a7230072bcda2f90e4ee", + "sha256": "5ec1779722dc0fda7f204111f658f2977944f145389cb41b4dd7e43bc8eb3293", "shape": [ 640 ] @@ -90,7 +90,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_1_cross_block_n2_weight.f32.bin", - "sha256": "17201b47c33c425b4e205726a1dd0160224d21a7816a27b3cb2482936373dde7", + "sha256": "e63f46aee081e5e0c9d914cf5a63990a7f8cdf18d69d1c9e3bfd5dac3f529414", "shape": [ 640 ] @@ -99,7 +99,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_1_self_attn_block_n1_weight.f32.bin", - "sha256": "91b80f1512d95b8b638e62d76ca66106598d2a41de988d6f8403bb16bf8fc4b5", + "sha256": "bf626ce4b9540732ae4b0e41e6ecf8df9d37aef2c0f7835fe82da74e8f8350a9", "shape": [ 640 ] @@ -108,7 +108,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_1_self_attn_block_n2_weight.f32.bin", - "sha256": "0d7f5387a2d28ad4f6e0ee3b902c0e0ebb6ece2960c479f6591f1cfeccd1bb3c", + "sha256": "19644a427ac6450eac03f470c361290f3d1045900726fcea28a9973373b5c76a", "shape": [ 640 ] @@ -117,7 +117,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_2_cross_block_n1_weight.f32.bin", - "sha256": "6cf4842fcdc048c1a9115fb862bf401bf0504315cfd8afd393ee98ec614393b0", + "sha256": "86e9c81d560b6bf1d1ad5b41f54e516e751e97f70c874b0c9adb6fbf61914c3d", "shape": [ 640 ] @@ -126,7 +126,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_2_cross_block_n2_weight.f32.bin", - "sha256": "803b8acfc59c8244383517cb942b6e521be21bb3066a7de0ed452bbc49312fef", + "sha256": "3a71a2d3f2600a26735b357ddd3a4958bd4590964d149155f1c2167089349d9a", "shape": [ 640 ] @@ -135,7 +135,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_2_self_attn_block_n1_weight.f32.bin", - "sha256": "ba167f943b727d733c4460cbd347a4e7a2e7465d6dbd94d2bfc011935a1a9bb9", + "sha256": "3ac4f3b079f383cc503850ddc0a18679c166364488cd12cf5521d9e1c5baaf34", "shape": [ 640 ] @@ -144,7 +144,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_2_self_attn_block_n2_weight.f32.bin", - "sha256": "31d621d52ff0754ff33599bf8d85762a7458dca818ddce1c93310648f2b2a5d2", + "sha256": "8ef13c495f661d19e234362142100d58912a517f4d290dab698282de1821ab91", "shape": [ 640 ] @@ -153,7 +153,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_3_cross_block_n1_weight.f32.bin", - "sha256": "40264c9a18a77c788d5230f95c0de43f008b8f846a0be466a875f260b2b5b057", + "sha256": "9ae1fc97c13441dddbbb3e9eb5d47198a3d607c88ec4e43c93d2c81bde27b4d2", "shape": [ 640 ] @@ -162,7 +162,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_3_cross_block_n2_weight.f32.bin", - "sha256": "091cf7ee073bd6638db219adb03f4295ab68be5d7721a4a7135ab647a3d17b20", + "sha256": "429c331c002c12043871fbf215b416f2db8a1d5f79ce9431a6a907ba17eca8e5", "shape": [ 640 ] @@ -171,7 +171,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_3_self_attn_block_n1_weight.f32.bin", - "sha256": "2d5aed83057285fead1f0ad341fd4e45739d408df90af9b948e00d6cf672ff3a", + "sha256": "4ff58a140da536f85cb1e90acc5235cd45559ae129fd770960044e4c630fdfb9", "shape": [ 640 ] @@ -180,7 +180,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_3_self_attn_block_n2_weight.f32.bin", - "sha256": "addf0c1c46f80b69327ed9ba9d291fc0ac3f8f46b1d32430a0550fcfbb9bdf81", + "sha256": "de3959c7d087a5d74e7cf13df2097222754acff9efb0d2f661578d10ddd176a5", "shape": [ 640 ] @@ -189,7 +189,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_4_cross_block_n1_weight.f32.bin", - "sha256": "622fd2c7811caafb6ec4b6672cdb77d6b1a2677a86156c8787c7e076af8ad2b6", + "sha256": "b009766fbf166bc3f7a0dacd2d9a161fc04e586c117a836ce0ebd9fa1ca3ec6f", "shape": [ 640 ] @@ -198,7 +198,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_4_cross_block_n2_weight.f32.bin", - "sha256": "df5cba19f68c1688c76c00ae547fd4417319068557d1ffd631fd306c774c735f", + "sha256": "d40db0671193777c76f5cb7dbdf13f7545a871771b35b770dadd31ec7e825b7c", "shape": [ 640 ] @@ -207,7 +207,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_4_self_attn_block_n1_weight.f32.bin", - "sha256": "36f463ae849c04e510290002b2baf5b6852b7f388e8e75ee98365ad3d8a12764", + "sha256": "74d5d626c5d30fbcb004d3b9cccdcb680d0dceac061d3c9ad3e3367a478daeb6", "shape": [ 640 ] @@ -216,7 +216,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_4_self_attn_block_n2_weight.f32.bin", - "sha256": "2e36fb000644e19c7de577abdef101e67362cec1f4866028d06494320f770617", + "sha256": "ca807c21a8be5611a6f3d26636658cc23b0294f7a5372f3b1a4e3552a31cbdb1", "shape": [ 640 ] @@ -225,7 +225,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_5_cross_block_n1_weight.f32.bin", - "sha256": "44104d135d3013adbd3b9cfd7245f9c2567d998d3417cd8f5588bcbc34e2996d", + "sha256": "0a7029d09d53f7812b45876923a3267f322dc1f873bab81b4099f72c1eb29f46", "shape": [ 640 ] @@ -234,7 +234,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_5_cross_block_n2_weight.f32.bin", - "sha256": "46f24a5c1006acec251c6615268e31cea8682feedf76839fb16cde44f4fde5c4", + "sha256": "1539fa69b705976b0158b27c31a421b0103398f5b7d938e1dec79c871eeedfd3", "shape": [ 640 ] @@ -243,7 +243,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_5_self_attn_block_n1_weight.f32.bin", - "sha256": "67b346c953e25cd41b9f5ce533d93e3c3bd5869505b684be203c676d7b7179a9", + "sha256": "5c5c49ebf225953e7a3c584cd779e73c253e11f01ff26749229b9c9b47cc6a41", "shape": [ 640 ] @@ -252,7 +252,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_5_self_attn_block_n2_weight.f32.bin", - "sha256": "451996b77d575d3d1d40c5e1e9d96c24448c93d039999b91d132b7d4b37a001c", + "sha256": "7ab9b449fdbfc619624903516d79e6f920b50c2ceb15d14078c3782b0a4f3f49", "shape": [ 640 ] @@ -261,7 +261,7 @@ "bytes": 21009920, "dtype": "float32", "path": "dense/enc_embed_weight.f32.bin", - "sha256": "4f4e6de1db97417c8e97c5e715dd064b5c33c9e94702ac758166c94c5cef61da", + "sha256": "78c2a80005b8926af3752edc2ab4c56399688951a282a6b85bf9edbf917fe6df", "shape": [ 8207, 640 @@ -271,7 +271,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/enc_norm_bias.f32.bin", - "sha256": "3137fc19f4ff925c8811da6be650c38698d307578e74cf3757fd3607a0be0c29", + "sha256": "73c7b6e76072acad2244afc73657d29377fd189a8af9bc41daa14aabb346606a", "shape": [ 640 ] @@ -280,16 +280,26 @@ "bytes": 2560, "dtype": "float32", "path": "dense/enc_norm_weight.f32.bin", - "sha256": "d08173a24ed7c4e20a10a518254f215886e33efcf83e185160a4c033cf84ad4c", + "sha256": "fbce78fa3910cca15c0bec29f929009612f7f5b94d1d083771ed0b114bb2a337", "shape": [ 640 ] }, + "enc_pos_embed.weight": { + "bytes": 10485760, + "dtype": "float32", + "path": "dense/enc_pos_embed_weight.f32.bin", + "sha256": "41e06124cce8055432e8e6a7a9a9a2a6e39ac672071f23dea5872bd19c51e4d9", + "shape": [ + 4096, + 640 + ] + }, "encoder.0.n1.weight": { "bytes": 2560, "dtype": "float32", "path": "dense/encoder_0_n1_weight.f32.bin", - "sha256": "9dd433b1403ac0fe16541c304a42d3e67b0b2cb32b47e872ed0be569596e6e66", + "sha256": "146bdd3c5419ea957cba0919904c3fa3a18345399e1190e38b1697c5bc56a18e", "shape": [ 640 ] @@ -298,7 +308,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_0_n2_weight.f32.bin", - "sha256": "9d33d04a66bcce116bbd0bc6072b494a5f68c3e77f69f0549326f66a75c68b5e", + "sha256": "2817160dc2b42d5f8de29fb566ed4165dff109f084f8a5af1766e544a7fea509", "shape": [ 640 ] @@ -307,7 +317,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_1_n1_weight.f32.bin", - "sha256": "177e15460da20c7b1452c39daed8b193781de5a7723a82eac4b9089897447a18", + "sha256": "4b3b5cbb90b337e7c217bfe73872429a99ef7aaeda0743a01e7c78b496abce08", "shape": [ 640 ] @@ -316,7 +326,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_1_n2_weight.f32.bin", - "sha256": "99cc691f53f600e90d3f636f673359af993b1f2f2ce259f7dcb61d6d1647fbab", + "sha256": "2030393e0c8cc4554a10187e03f03e541a380227d3b64c3f6455aa23d8295be6", "shape": [ 640 ] @@ -325,7 +335,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_2_n1_weight.f32.bin", - "sha256": "84cea3917081531f374901364d9a36691227083d011ac1364e01c8b1866b2ac2", + "sha256": "203d16e2f34a9fb6059e24d8bde0b3d2e85e8edbeaecb2eac7c647b9c81f1dde", "shape": [ 640 ] @@ -334,7 +344,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_2_n2_weight.f32.bin", - "sha256": "5f14762332dbb644ff274586a0ba82af4be2c4cdc469d31e166d488044c9dd35", + "sha256": "a223438f7de8e65465b9c95605748e0152bc1b92d77b72d3af2a41d9ff108927", "shape": [ 640 ] @@ -343,7 +353,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_3_n1_weight.f32.bin", - "sha256": "1abb733c2331d9145ca33290b207dbbc6dc15053f56aaef9b659df4662b0eb41", + "sha256": "6f97f7dc429e26a0e2950787e5ec7c9fa3c3ab9b8ddd0fc1279c19908fdb9868", "shape": [ 640 ] @@ -352,7 +362,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_3_n2_weight.f32.bin", - "sha256": "4c7407197d1d85e0693f4056925b029929bc471f659557c9a39f0383f6cd3266", + "sha256": "9754f40fc928fdca4359684c41888d1b3d6af817936af59b161f3824b32534ff", "shape": [ 640 ] @@ -361,7 +371,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_4_n1_weight.f32.bin", - "sha256": "eb44b4546a957ecc9b8f8c70b985fdd04cf7b634d3b1ebd4aef456387beb683e", + "sha256": "2195f562646510d2e377c5d219dc1341d32001ed30b4d54cf754462cbcd175a1", "shape": [ 640 ] @@ -370,7 +380,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_4_n2_weight.f32.bin", - "sha256": "7626d463427ded1e6da5602867bd19a5baf2496d49c21878cf392c4acbbaa645", + "sha256": "75fda5bbfe2285970162c18ebf565ebe3e4032b2751b4bac289409a0ed8cb12b", "shape": [ 640 ] @@ -379,7 +389,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_5_n1_weight.f32.bin", - "sha256": "0d756e71405f5928a6ae70ef262b4237a8584a795a60eaa158c1a234d05b2bc2", + "sha256": "eb288cd1ccb8e5b7d5da5e6fa88afd881471b0bbbd355e14adbc3b885385e71f", "shape": [ 640 ] @@ -388,7 +398,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_5_n2_weight.f32.bin", - "sha256": "b7fc6eb738eac62a7880893a3c3f35913ae958f06eb9593942bc2fc63ba1f9d1", + "sha256": "75218ab909794e1396d0a651023851988cfea12c5085c9230b883188d3a66ae1", "shape": [ 640 ] @@ -405,6 +415,7 @@ "decoder": "dec_embed.weight", "encoder": "enc_embed.weight" }, + "encoder_position_embeddings": true, "final_norms": { "decoder": { "bias": "dec_norm.bias", @@ -1293,6 +1304,9 @@ "n_heads": 10, "n_layers": 6, "norm": "layer", + "position_embeddings": { + "encoder": "enc_pos_embed.weight" + }, "rms_norm_eps": 1e-06, "supports": { "batch_size": 1, @@ -1349,7 +1363,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_0_attn_w_q.packed_weight.u8.bin", - "sha256": "f2eb1c46f31e66c4514bf852f88b348e101f0c5d590930219cf0dc628d206476", + "sha256": "951c976f47b39ba620a2703f97b02ed8e753ccd8bb95a9c61ed0911139dd9009", "shape": [ 640, 160 @@ -1359,7 +1373,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_0_attn_w_q.scale_values.f32.bin", - "sha256": "1b78ea9eedffdde48507aa32fda72ce0017963541a013b187aceb94fa9e221a4", + "sha256": "58f656d894a6673181860f8ec88093f0a6254b00ce39b1cb1e108f1615e638ab", "shape": [ 1 ] @@ -1420,7 +1434,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_0_attn_w_k.packed_weight.u8.bin", - "sha256": "2f63ce5b91036dd26a20804e19e3fbddb0ce8195855c9e802e16b4159806e016", + "sha256": "0d358351e42a919e6f41efc8d3d8220d202c7a2592a36b18b1e4039c0312c49d", "shape": [ 640, 160 @@ -1430,7 +1444,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_0_attn_w_k.scale_values.f32.bin", - "sha256": "d8473447ad8c185def4c9c3ff9c2d9d3eea1870c01697de407ffd7f06271127d", + "sha256": "363a2535ff463d2406751ad619b676aaf8f5043f972b10829d70e5c5370541e4", "shape": [ 1 ] @@ -1491,7 +1505,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_0_attn_w_v.packed_weight.u8.bin", - "sha256": "11bc624dbf8bd0c250e711eaa29632f9d3348f21c9b3c9d993c908a2476a0d48", + "sha256": "5f2fd0f6297addda94dfd003cc2902fbce3b926e9d3ccb9fbf56f118ba987bc8", "shape": [ 640, 160 @@ -1501,7 +1515,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_0_attn_w_v.scale_values.f32.bin", - "sha256": "126404b59d4db50a3fb6fbfb0cd22a8ad394b3a2181ba9f0f189443d7560db56", + "sha256": "834cb863484c883b449cc141b0d11a1441c8d5d4c6c00b76092e54b1b9726ffd", "shape": [ 1 ] @@ -1562,7 +1576,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_0_attn_w_o.packed_weight.u8.bin", - "sha256": "e68c975be66010affb7679586381681af5d449d90380aa8333bf01ce8c266c39", + "sha256": "83c19e24982850a0703bc51352e8d2dcf2d9c58cac17c3fb58815327b0117251", "shape": [ 640, 160 @@ -1572,7 +1586,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_0_attn_w_o.scale_values.f32.bin", - "sha256": "29c8b68c8c6d1ed6f90d6e01800fa4da76dface1f032e86f807e07e6ce500150", + "sha256": "92e6c93ca7bf5dfca57fdc636156023c476dba44daa150855c770b191b2812d0", "shape": [ 1 ] @@ -1624,7 +1638,7 @@ "bytes": 16384, "dtype": "float32", "path": "encoder_0_mlp_w_in.bias.f32.bin", - "sha256": "73208703f263f727756bd48cbd994daa526006f49f7a0b5081f0fec0390c6262", + "sha256": "3a2cab48442eaf53044fbe153c8e3688fdd3ec3c035f8edeeaf67d3bcddaf4ff", "shape": [ 4096 ] @@ -1642,7 +1656,7 @@ "bytes": 655360, "dtype": "uint8", "path": "encoder_0_mlp_w_in.packed_weight.u8.bin", - "sha256": "7ab9b1aebe99f1dd0c8c67488d9d137e540f1e11c6b5b8bad401c1ea126ce834", + "sha256": "8084c90cad779fcfbf3a68dd3d751dab75a495d6798f8d125b67ee076582c72a", "shape": [ 4096, 160 @@ -1652,7 +1666,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_0_mlp_w_in.scale_values.f32.bin", - "sha256": "77cc54c25fc58c33ae5ac086bc2f27f02eac61df14eceac3e8a03410bad8b7f2", + "sha256": "fc25f4d74c3d8a0be61dd9b7b006c93e806bc6dc048c05e98596e8542c1327c8", "shape": [ 1 ] @@ -1704,7 +1718,7 @@ "bytes": 2560, "dtype": "float32", "path": "encoder_0_mlp_w_out.bias.f32.bin", - "sha256": "ed49c800405f2b13ac01856aed66154cd2e1aa6405de541986706eecb22af8d3", + "sha256": "6d95b0054d8d8c155e33665b1fb3c0dd454478ad2a95eba4316160883bdefd47", "shape": [ 640 ] @@ -1722,7 +1736,7 @@ "bytes": 327680, "dtype": "uint8", "path": "encoder_0_mlp_w_out.packed_weight.u8.bin", - "sha256": "4b0d77b5c3e1e79d71ff659e164425aecde16daa9e9a480ab3b8ca044e5bcad5", + "sha256": "2b475a637893e79948117383cd9138d44690a04653e49985b355e6e63693a783", "shape": [ 640, 512 @@ -1732,7 +1746,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_0_mlp_w_out.scale_values.f32.bin", - "sha256": "9e53add4a0b7ab6184f4c36e38a5931859ecc3549c4c5de76131356cfb8b70ec", + "sha256": "827241212e161c00a58bf08aeb8e001a475599cfb6786c2945b15dc39afe3dc7", "shape": [ 1 ] @@ -1793,7 +1807,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_1_attn_w_q.packed_weight.u8.bin", - "sha256": "8940fa8a4deb50d60c9fce77c30bff8e9cca946bc31abf081c2375570a288b2d", + "sha256": "abe92f5a662e92da5725883968212a2e90a77f05e8499dd0eb5c3134279535cb", "shape": [ 640, 160 @@ -1803,7 +1817,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_1_attn_w_q.scale_values.f32.bin", - "sha256": "29b3b5b9328009be6b021713f0759c18c17a06ba90b3ef71a6e863ee0918be5a", + "sha256": "f92420a0087a6ad79021a64f1300eeb7d53c4146df1e5f92c339fdd606d4808b", "shape": [ 1 ] @@ -1864,7 +1878,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_1_attn_w_k.packed_weight.u8.bin", - "sha256": "a94892001dbbde4f76f2bb974e8e5f1b016c8a1c7bedb4fa599e6d98e6a3f862", + "sha256": "27b7e94565efaf4b3c1518f3862c56328a9e2ecb594cdd76f52e8ecd87cbaeb2", "shape": [ 640, 160 @@ -1874,7 +1888,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_1_attn_w_k.scale_values.f32.bin", - "sha256": "af573c1fcbaf6ed8e00ecee3be2df83045a17316c10bbc1204ec5d045243e648", + "sha256": "8e90310d7f602900c61d1ec0029aa69460d20598de178d6755dd8b6c42b109ba", "shape": [ 1 ] @@ -1935,7 +1949,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_1_attn_w_v.packed_weight.u8.bin", - "sha256": "1a01f6835913c38e63770ae5fe0ab82479ffc2752577a6eb44d24af3e00d6587", + "sha256": "fe4fc47da4a97ad0fd49c5dcbb7175aec7a0d2f7fa4f9f82c2703ca88cd13b76", "shape": [ 640, 160 @@ -1945,7 +1959,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_1_attn_w_v.scale_values.f32.bin", - "sha256": "47b1d24599171b0027ee130ebf038f4b1694a326f7d6a783678eedcccadfbf3b", + "sha256": "b2efaab082de4926716917ed6472d67ead22eaf2c71ebdcae672069a4acdf9fe", "shape": [ 1 ] @@ -2006,7 +2020,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_1_attn_w_o.packed_weight.u8.bin", - "sha256": "f19e5897cb1f6b93eafa7777649e0d337bc230a814b8ecbdbf81316e4e448309", + "sha256": "e1d4ba087cb7fd9337ad647b9ef35af6ef83ef1a9e2611f177e7e76cec268d67", "shape": [ 640, 160 @@ -2016,7 +2030,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_1_attn_w_o.scale_values.f32.bin", - "sha256": "b016b418d7fc1745d3617cbbc7b69aff439aeabd33920e142ddc659297ef3c0a", + "sha256": "94401ac4905ab9a6a51cd297f505caa81434ed03ba406ef6a8cc3e1759b2dbcd", "shape": [ 1 ] @@ -2068,7 +2082,7 @@ "bytes": 16384, "dtype": "float32", "path": "encoder_1_mlp_w_in.bias.f32.bin", - "sha256": "76f3eb35f85ad10508ad5d77d1d368ef3aa6f9fd05e8855de5bb591aea755975", + "sha256": "025bae5bd7c6d3874c23d1348d4d32d7a5c399e719416f1b22112784599348f0", "shape": [ 4096 ] @@ -2086,7 +2100,7 @@ "bytes": 655360, "dtype": "uint8", "path": "encoder_1_mlp_w_in.packed_weight.u8.bin", - "sha256": "34a577f6ad2057bb305520709eeabda752495cd4fb693589c61f70a6783eeef3", + "sha256": "97ff605bae210a9b872523f788aa25bf06ae8da80eb62537ac6ba898ab0cd4aa", "shape": [ 4096, 160 @@ -2096,7 +2110,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_1_mlp_w_in.scale_values.f32.bin", - "sha256": "0aab2d4afd974f7590fd6bc26ba84554f25fdf581885f8c2933ce4cfebc8592e", + "sha256": "b14e688ad3655e5d1c26fc671f68d4911632515459181f058a45f5cc218a7973", "shape": [ 1 ] @@ -2148,7 +2162,7 @@ "bytes": 2560, "dtype": "float32", "path": "encoder_1_mlp_w_out.bias.f32.bin", - "sha256": "144c6c1b2a8b8dcfad3773938ab747e78d26057affe44e238d073e9ecde4d0fc", + "sha256": "44d5985a564ba0032aee0a81b081ba706266d8e085a12c7f44d688918c8f4811", "shape": [ 640 ] @@ -2166,7 +2180,7 @@ "bytes": 327680, "dtype": "uint8", "path": "encoder_1_mlp_w_out.packed_weight.u8.bin", - "sha256": "1a5c8c3c81b509c6fdb649cc2e3ea49b1cc694ae6976fdfb721d49c474440692", + "sha256": "7742ee5975e591618aabc5105a207b0f78065d02ee41cc6b45ac88df12bb4c1c", "shape": [ 640, 512 @@ -2176,7 +2190,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_1_mlp_w_out.scale_values.f32.bin", - "sha256": "14782673a4a81e0073f5799d05e72677ba9b13ce33ebbea20066976706374f5b", + "sha256": "d4519cac1203163e20411c81058fcc9e15b2715b873377d9867a23f75a878b8a", "shape": [ 1 ] @@ -2237,7 +2251,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_2_attn_w_q.packed_weight.u8.bin", - "sha256": "728cff4693aaa8b3412cda55a9c5eb3cd34fa3319fe0d32b47e769b67acf27cf", + "sha256": "4046b1503f400adae06277ce337563059601462ea3ed824adc1143d2bbae8d25", "shape": [ 640, 160 @@ -2247,7 +2261,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_2_attn_w_q.scale_values.f32.bin", - "sha256": "a676145c71d793b31b8e1c700433b6c5ee619abe5781ae6a7f3d3138ebfc6790", + "sha256": "b6a2a79210118706fe89b4ddb96a41eb06075852ab1c209cdcab1652caa3907c", "shape": [ 1 ] @@ -2308,7 +2322,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_2_attn_w_k.packed_weight.u8.bin", - "sha256": "a8a9ec384334edc880f6185c64a8bff5589bbaad2837e7fdd01171273fffc8bb", + "sha256": "32ed7fb622aff2cf751fbd3986344f581380fc2d004517e2b3b7ae111fd31bca", "shape": [ 640, 160 @@ -2318,7 +2332,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_2_attn_w_k.scale_values.f32.bin", - "sha256": "8dd1eb0a4bd4d76edcb4df2a26bf09820b0823dcc01658344ff578826bf3a0be", + "sha256": "8607a763ae93991b49232ae2fd052fc67c7709ef43d9074d8bd91c940a2f4217", "shape": [ 1 ] @@ -2379,7 +2393,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_2_attn_w_v.packed_weight.u8.bin", - "sha256": "556bfae148c0efc3fe914cf102c008342ebca522e62edfd5b2664ac32aa70c06", + "sha256": "64940ce687d9f5cac4bc5c0ebeedaecb3e8551bfaf05135a27c04b4158b9b9f2", "shape": [ 640, 160 @@ -2389,7 +2403,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_2_attn_w_v.scale_values.f32.bin", - "sha256": "5203a15a236be8e0d05745452f1eba88b7ee04fc550a31b0839d4cf3bd15a90b", + "sha256": "17eb0fc4ae802ce844e776193fc48d96664c74682bd8ed65f0659401c25ccee2", "shape": [ 1 ] @@ -2450,7 +2464,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_2_attn_w_o.packed_weight.u8.bin", - "sha256": "8fcf7d9111e69f47f88f1c1c02447b2c07d4edda7830a62241ce46b52d6bfd31", + "sha256": "4cd3154e5a261d3671f9255147f5c7c123b89e391fa8d95d0e0d8f0aee5b6824", "shape": [ 640, 160 @@ -2460,7 +2474,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_2_attn_w_o.scale_values.f32.bin", - "sha256": "a48b17cd6544aead4b0d681a5bacb90b0fbb0dc0fbd5e9b43703af9d655fff28", + "sha256": "bd285179d72698f1f3ec0a18f279f4656df36d31c859f2b106ec8b01caa99dad", "shape": [ 1 ] @@ -2512,7 +2526,7 @@ "bytes": 16384, "dtype": "float32", "path": "encoder_2_mlp_w_in.bias.f32.bin", - "sha256": "55f1ac5b29cccff2b7c2e26766f16f4eb81173f165d889b6c484a41b7adf6020", + "sha256": "756a058396dc773b98e7fb45c72299bb1402b3a7f4ff319a435fdae1a5a14a0d", "shape": [ 4096 ] @@ -2530,7 +2544,7 @@ "bytes": 655360, "dtype": "uint8", "path": "encoder_2_mlp_w_in.packed_weight.u8.bin", - "sha256": "d644ee10bc3b7f73bfa320283405780d256ef4809748bde34fdeb899369685e9", + "sha256": "5c27668c24ade7f4989551e3a23c729512fa3399126e8131a9a7c3b7beba93f2", "shape": [ 4096, 160 @@ -2540,7 +2554,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_2_mlp_w_in.scale_values.f32.bin", - "sha256": "77941e8d1c33bf8e9f73dfb3902ddaba54ae2b4c9d33a14b40affed7a230d658", + "sha256": "ea11ebc8e04d3fa09dad49efbb2465b461308a8353d1fddf1008c25cf47b1f49", "shape": [ 1 ] @@ -2592,7 +2606,7 @@ "bytes": 2560, "dtype": "float32", "path": "encoder_2_mlp_w_out.bias.f32.bin", - "sha256": "bf765646a81720449bcd584215038473a9cb7ef7125e4cfba5cac598127e67fe", + "sha256": "1a85a10eac9d0a55eec02edf2e3b706e87066e836808c100715b883e65689cc5", "shape": [ 640 ] @@ -2610,7 +2624,7 @@ "bytes": 327680, "dtype": "uint8", "path": "encoder_2_mlp_w_out.packed_weight.u8.bin", - "sha256": "5ff72ecd699899e9a4ea52137bd662ca80a3272f8e51f2a98c97a6be25d4235c", + "sha256": "dd26321691449af82d643801b9262dff7365260cc32b665c25dee5889cd4df69", "shape": [ 640, 512 @@ -2620,7 +2634,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_2_mlp_w_out.scale_values.f32.bin", - "sha256": "97cbd68d328e18fbfda32667ee470c3aa4eafe78bd0b78b995f2bfe564bfcca3", + "sha256": "ca2d4e4c3da8b0e7a0ab688a4883b2040bebf1e22d545576a795c847e5ea2b28", "shape": [ 1 ] @@ -2681,7 +2695,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_3_attn_w_q.packed_weight.u8.bin", - "sha256": "93a3d233014e43a89110fdbcd913ebeccbee67222bc170bdc097e5d1a14f790b", + "sha256": "baa0d119c263884f0022dff7e7e4020996ea2c91c9912f568f2ede5559432027", "shape": [ 640, 160 @@ -2691,7 +2705,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_3_attn_w_q.scale_values.f32.bin", - "sha256": "9228202b5e7125cf5b8bdc0e53498cb8165e7130b718a59da5d6924ad99173c4", + "sha256": "adad57af78e9167da8b4e5855e46083456100ffd1ed101e0f84074e9496c7d27", "shape": [ 1 ] @@ -2752,7 +2766,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_3_attn_w_k.packed_weight.u8.bin", - "sha256": "615881e833f29f120b78dde432d5328a8447ae9d1c08b242f523be3d019382d2", + "sha256": "5a9a3e87cb0ccf9381821b2c13cd09a88996d04fcd808ae3b6313622c9986444", "shape": [ 640, 160 @@ -2762,7 +2776,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_3_attn_w_k.scale_values.f32.bin", - "sha256": "b45f07b7955b4ae7104c7df0c5d3fa813bf7125a8768ad0741d10a7acd3218c8", + "sha256": "c94e97d5feb0a8acb690700c648981cd8ddadef54399a0a263cb112141cea08d", "shape": [ 1 ] @@ -2823,7 +2837,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_3_attn_w_v.packed_weight.u8.bin", - "sha256": "7c3eaad05215d7ee91070277ad7518baa3fd19b900c5b2c6ea621f51f8d7e577", + "sha256": "2bd7d1359728efce205ef25d36c8d47b7ded204343a3074ca03ad64bb485ae42", "shape": [ 640, 160 @@ -2833,7 +2847,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_3_attn_w_v.scale_values.f32.bin", - "sha256": "350d62ab7cd78d7c07e33dda62d04dbbb68586a00b5fc3d7cdfca3d59117371f", + "sha256": "f7b3d178706d789bfbc5ed3419c8abdfce30d733cd967d5a7ce3f92560ecb7aa", "shape": [ 1 ] @@ -2894,7 +2908,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_3_attn_w_o.packed_weight.u8.bin", - "sha256": "670e7caebcbd937e313590599bad83fad1f999d2e4256a21dee1119293d069db", + "sha256": "6291c1abeaaea0b97649438a296d76ceb106575b71884102d3542b00ef05e8c6", "shape": [ 640, 160 @@ -2904,7 +2918,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_3_attn_w_o.scale_values.f32.bin", - "sha256": "8b688d988ba3c12fcbe0b2cd81b3140a2a7403d7c986f99a0398856152282ae1", + "sha256": "bd39061fcce791e35176cff9de492ef93343a6c39e27730e241ddedfb549a768", "shape": [ 1 ] @@ -2956,7 +2970,7 @@ "bytes": 16384, "dtype": "float32", "path": "encoder_3_mlp_w_in.bias.f32.bin", - "sha256": "9b94e5c80466ca951ccc2ce5e34b000be946db165d23abc5eec20731ce507504", + "sha256": "fd93590315d0550dadb82709589d499011558085fe7f42aa87a41a87c2742e9f", "shape": [ 4096 ] @@ -2974,7 +2988,7 @@ "bytes": 655360, "dtype": "uint8", "path": "encoder_3_mlp_w_in.packed_weight.u8.bin", - "sha256": "db06ff658696f3c55e103c70b7e2c0494f68492ec148363b0c06f2c2e64da426", + "sha256": "8b117e51f471d478c8c5da5e498e0635c1ce74b32e75e4d923b6485ea87353da", "shape": [ 4096, 160 @@ -2984,7 +2998,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_3_mlp_w_in.scale_values.f32.bin", - "sha256": "d08e720749c4112b88d0fe34674fb6851bd5ec321c3e8ac40d4b157cc60c99c1", + "sha256": "49e75f99e2d5f25276cbb411044e6acc42c8b520b449a0e88d0f36927fdb3b9b", "shape": [ 1 ] @@ -3036,7 +3050,7 @@ "bytes": 2560, "dtype": "float32", "path": "encoder_3_mlp_w_out.bias.f32.bin", - "sha256": "44865713fc16e41e8061e1be0678e07e8f85157d5c540b51c9a79b52090b1cbc", + "sha256": "0f4777ca7ed1def47f66c0c13245e859f585b3401bff9b2fc0692869bcf6c3b8", "shape": [ 640 ] @@ -3054,7 +3068,7 @@ "bytes": 327680, "dtype": "uint8", "path": "encoder_3_mlp_w_out.packed_weight.u8.bin", - "sha256": "e5afd5b12dbc0a921c3d5be92f444c00e9fe35514919ead5113bfbefe70eb423", + "sha256": "3ddab3f329beb5d19a28e69aef00ac69b708a6696f78e84254033d362b4cff02", "shape": [ 640, 512 @@ -3064,7 +3078,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_3_mlp_w_out.scale_values.f32.bin", - "sha256": "9c245c034ec27db041b7a2cc308dab23a6ed2db32a09af0fb587d2826dd8e5db", + "sha256": "fc14d3937542e30e559658d7b9bb2377fd78c81771e3f3e7cc20c690648ea7b4", "shape": [ 1 ] @@ -3125,7 +3139,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_4_attn_w_q.packed_weight.u8.bin", - "sha256": "a745262c6dfa925e52caff29d28d589cc7f9a0de2fc31b66b1193d884a086c7c", + "sha256": "728a805cfca6f97949f88c31871ef1be00603a46d9bf20fbbeaf9a63ecd92167", "shape": [ 640, 160 @@ -3135,7 +3149,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_4_attn_w_q.scale_values.f32.bin", - "sha256": "018d0aa83591d3aedb9e18e578bef80d29a0c8b145d07831baf7736115ad6102", + "sha256": "3b9e454e60a6a13e5102da4c03d527762bcf2b9bf12d486e799d61c3658c8dcd", "shape": [ 1 ] @@ -3196,7 +3210,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_4_attn_w_k.packed_weight.u8.bin", - "sha256": "2b50baad9a382d17d6bba2109fe7c7afd6c658bef1533c4fe2d534ad427f7c43", + "sha256": "10a703b02e24bbfaf3495bc1425befd4a89e9c6f09744e2a1c0706355cbcbeec", "shape": [ 640, 160 @@ -3206,7 +3220,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_4_attn_w_k.scale_values.f32.bin", - "sha256": "9025f9bd080125d7499f6b4a768e6226046f736c06332055fc868f48b89f3a46", + "sha256": "531f130bb155c8228c57f8775050b5bc55fe608c07b428bc621c7a2397638773", "shape": [ 1 ] @@ -3267,7 +3281,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_4_attn_w_v.packed_weight.u8.bin", - "sha256": "90309d347ca7a149c7aec39fe41ca1281b0981220a4d9d7e81ff92a6838ce3bc", + "sha256": "e5d4f475baae4060d3cc5a3a82f3a52ad92447d23710c3bb3577d99a02ce890d", "shape": [ 640, 160 @@ -3277,7 +3291,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_4_attn_w_v.scale_values.f32.bin", - "sha256": "62dcd2181659d271311c3f48d2d30ffa824fc90775ed78243af216b5e5dfe17f", + "sha256": "8dc5c14c4a1ce0a7eda48fedb3496c154e2fd035b372b8c1fbb67ebfcbc3ad95", "shape": [ 1 ] @@ -3338,7 +3352,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_4_attn_w_o.packed_weight.u8.bin", - "sha256": "70bd484dcdf0064d9638b964c017b1da8bc62a86534a7aad8f4637f467b17ec6", + "sha256": "a94d196e77a98f4ed95df7a9102b2991e536dc5f3071302b1a497fce6d5de673", "shape": [ 640, 160 @@ -3348,7 +3362,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_4_attn_w_o.scale_values.f32.bin", - "sha256": "0edd3e4c033ed0928aae622f4c279639a88e324bd180d1b7f2a86a0ded3a7f2e", + "sha256": "65dafd5676fdc4978472be0e5ffecd6e5ec5549fb6d5664b79e8d02e4cd0878d", "shape": [ 1 ] @@ -3400,7 +3414,7 @@ "bytes": 16384, "dtype": "float32", "path": "encoder_4_mlp_w_in.bias.f32.bin", - "sha256": "9af5a6606f55fc82f725d4cc9ce177d34a22ea92bade6df259d63436380fedad", + "sha256": "1895bd3a783cadcce33598fd40adbec1468989bfb911673a0fb315883e21647e", "shape": [ 4096 ] @@ -3418,7 +3432,7 @@ "bytes": 655360, "dtype": "uint8", "path": "encoder_4_mlp_w_in.packed_weight.u8.bin", - "sha256": "330c9c65ca8995c4ee29fdd90955945bce2aaab71c92537223aea7aaeb0d6569", + "sha256": "9d3742046e3c417116c43c76a09c313d31979170bd39d42a5dde6f0a7e9ad08c", "shape": [ 4096, 160 @@ -3428,7 +3442,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_4_mlp_w_in.scale_values.f32.bin", - "sha256": "03dd37152ed6956f01f128e4d651326b253d0a7e3b9a35a65070922e5e1a21fb", + "sha256": "88b516eb6de001eed4819d59a8e8af51f48eabf45e0e08400cf7351198e404b8", "shape": [ 1 ] @@ -3480,7 +3494,7 @@ "bytes": 2560, "dtype": "float32", "path": "encoder_4_mlp_w_out.bias.f32.bin", - "sha256": "c920b2e3ea660534d14bea1df49772cc1b36d4faa2316234ae134ef3e588e302", + "sha256": "a37f53e3778a72816f2020f1e2e74ce0387bf8f7f1894bcb5e21337b17a975a5", "shape": [ 640 ] @@ -3498,7 +3512,7 @@ "bytes": 327680, "dtype": "uint8", "path": "encoder_4_mlp_w_out.packed_weight.u8.bin", - "sha256": "64b20c3eac7e24b676d7808230d57df66f48ddfe2627d40f5ea7ca8818d0535b", + "sha256": "cb2919b644968c18f3d8d07f4a7c2dff37300f3a19ca9252d608515e27356843", "shape": [ 640, 512 @@ -3508,7 +3522,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_4_mlp_w_out.scale_values.f32.bin", - "sha256": "7c930bcb7eb3ae14e26747f63a85e3bc9b5d51910ffefdcf0aed5f03081187c5", + "sha256": "acf932162b73f02f4dac3a61e9fbb063804e282e457542dcb81087ac0288e496", "shape": [ 1 ] @@ -3569,7 +3583,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_5_attn_w_q.packed_weight.u8.bin", - "sha256": "17992f4e033ba3cadc4024b246db460439d524500fbaa3e80fecc32c072015e2", + "sha256": "7dd4d44c1ffabf832cb1a2de16b9fe41eda6fdab014995e14d8e985656429fef", "shape": [ 640, 160 @@ -3579,7 +3593,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_5_attn_w_q.scale_values.f32.bin", - "sha256": "dbce1773e2798fbe649bd5b896bdd54ef0e360df6c126fdf0d1c28733486cf99", + "sha256": "7624e04915864961ee93653aa33a552ae72de0f333aac4bb5070ee12d3164a02", "shape": [ 1 ] @@ -3640,7 +3654,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_5_attn_w_k.packed_weight.u8.bin", - "sha256": "bdb31459fec6790046f058ff5417102ba655f3a943cccf66396236fa663f14c0", + "sha256": "6050252cdefae7097fef44b72a46832ef84555bf3129e31fb1706699b54fb993", "shape": [ 640, 160 @@ -3650,7 +3664,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_5_attn_w_k.scale_values.f32.bin", - "sha256": "933fac989d60e00f6148fdd80406d4d8b0ef95e2bb1c5bf0bb7d6eeabbf50325", + "sha256": "821f63202f456185ca334f8df5549720d54d696d62ed9ae84dfe0ba200913545", "shape": [ 1 ] @@ -3711,7 +3725,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_5_attn_w_v.packed_weight.u8.bin", - "sha256": "ef7c5acaddfb0083d3330e6b8f54dad6c037482910066c47374e42e8e756a303", + "sha256": "e53e30cf99dfb375124f09e4aafd8f94d002f350320d64ed184535c6494d67f7", "shape": [ 640, 160 @@ -3721,7 +3735,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_5_attn_w_v.scale_values.f32.bin", - "sha256": "51b137bb07bab1f7ae40e9693fa260009f5709a974777b2b4bd4bd8daf5f2e9f", + "sha256": "f76061e291a207776605c5ad3c7d62fe4d33568ecc9033af6c0b627e411b3c11", "shape": [ 1 ] @@ -3782,7 +3796,7 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_5_attn_w_o.packed_weight.u8.bin", - "sha256": "03fac26859771cd01d5af4fadacd835790eb7bab941be228b4bbfe723b31b03d", + "sha256": "0c9021bc8c3337e9e07cdeac52581df7895492820dd4c39aa2a8fa0a170e21a0", "shape": [ 640, 160 @@ -3792,7 +3806,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_5_attn_w_o.scale_values.f32.bin", - "sha256": "7ec8adf1d1d949c1dc66df40b209d212892a4c0879e1c25a3683c676db9321e8", + "sha256": "79dcab88153ccd85a92bf06a820212da7514276d13c9d246b383731a60ad4278", "shape": [ 1 ] @@ -3844,7 +3858,7 @@ "bytes": 16384, "dtype": "float32", "path": "encoder_5_mlp_w_in.bias.f32.bin", - "sha256": "b0602c6e9911ecf12d950fdbe9578826bece7652a4ffe3a4c4d09336867de439", + "sha256": "84867af91e82c506906ddb71b0a230680dd925d90773bb297b7fd5b0b7713542", "shape": [ 4096 ] @@ -3862,7 +3876,7 @@ "bytes": 655360, "dtype": "uint8", "path": "encoder_5_mlp_w_in.packed_weight.u8.bin", - "sha256": "701ef35d26908f55fbc1c25559a106e3b9996c6017650de149acba30a6b452b1", + "sha256": "93f7b29f255947dd72d7a5ad15b60f2c68c4b3e148b922f4794bcf96bf7aef87", "shape": [ 4096, 160 @@ -3872,7 +3886,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_5_mlp_w_in.scale_values.f32.bin", - "sha256": "75b4b4d89d08840c2f4176f269224be79faecfaced1b6be41d285d0d1df7dcff", + "sha256": "07471f0e22ba2cd8c2c7b735c203d91c874fc834b4209788a236fc9529247943", "shape": [ 1 ] @@ -3924,7 +3938,7 @@ "bytes": 2560, "dtype": "float32", "path": "encoder_5_mlp_w_out.bias.f32.bin", - "sha256": "6131b28da40f02a17f49f84ea2dc74a0ce5b702e2f0d9eb4392ea28bb85c4e76", + "sha256": "d1ccf0c6e752d23d27842dde01b4bc430190dab45e3bfa8dd8417dfe4c13cb15", "shape": [ 640 ] @@ -3942,7 +3956,7 @@ "bytes": 327680, "dtype": "uint8", "path": "encoder_5_mlp_w_out.packed_weight.u8.bin", - "sha256": "83b2c60db531b3fa20066c2c4e1950b6900a7a27fb932eab96df17efd383bcab", + "sha256": "5c8cf16a336ac7618477e7a52f8eb8b12d5bbd7004f961745f08abfb3f36039d", "shape": [ 640, 512 @@ -3952,7 +3966,7 @@ "bytes": 4, "dtype": "float32", "path": "encoder_5_mlp_w_out.scale_values.f32.bin", - "sha256": "d06678dcf842cc83e25aa12695675d8abd59d0dd3002a6a70d8b6e78b53af1c8", + "sha256": "4587070b10b62cb7687541b3e9946824e292b8f024c39b9d388202d61a5244b4", "shape": [ 1 ] @@ -4004,7 +4018,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_0_self_attn_block_mlp_w_in.bias.f32.bin", - "sha256": "6da013727d9557ff5ea212b7d124340fd66cc6ae8324710fc48077d8b77efce7", + "sha256": "738b38445bf3e8a03e758d3c67b687f1349b33ecb802888f642e1c7b46a65d17", "shape": [ 4096 ] @@ -4022,7 +4036,7 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_0_self_attn_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "481bd133a5c48455630d34e2961c65d13f8aba072205c152dacc131795637e85", + "sha256": "2879daff121daeb59a75ae0cf2b8947e8591f2a94508e838311fee26485c3554", "shape": [ 4096, 160 @@ -4032,7 +4046,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_0_self_attn_block_mlp_w_in.scale_values.f32.bin", - "sha256": "0d5c9cbece594a01b9fc12756117ac0994c4a329b9bad1a30f2160e9fc42d261", + "sha256": "b68d1acb8653e3e87271faa0828042ef37a00bfa0dcf2228db49017a23b67949", "shape": [ 1 ] @@ -4084,7 +4098,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_0_self_attn_block_mlp_w_out.bias.f32.bin", - "sha256": "d48a4623aa0453584d08f60a4c993f6ec7450c22f87d0b41042440a93909d2dd", + "sha256": "e057a152b1e3b3bc1f982c0c5ac0c80853a2d0358775f9a74cd2189332b80336", "shape": [ 640 ] @@ -4112,7 +4126,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_0_self_attn_block_mlp_w_out.scale_values.f32.bin", - "sha256": "adac014368b20fd45628680e0d18e4dbb100dba15682564651338ee0619f0a4c", + "sha256": "d45c24f580c64ad0f07e0f5af42a50d887322f039d32b0b7b7aa79d85e9c3d7d", "shape": [ 1 ] @@ -4173,7 +4187,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_0_self_attn_block_attn_w_q.packed_weight.u8.bin", - "sha256": "73085bdfeea8e210e3851ad505e3ecb1a77d6dba6a3cb56452de02eaeebec1b1", + "sha256": "e7f4ef6d97be20f7ac273b0280302bf087151da75c4a2bc645ddbc74f340279a", "shape": [ 640, 160 @@ -4183,7 +4197,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_0_self_attn_block_attn_w_q.scale_values.f32.bin", - "sha256": "35aaf02e17f4cbf3a47587d3b8abceea4bc0716327ad1dac8e610870105bd75d", + "sha256": "e1d0d0af2f97073330992aed3e464957c7f31a5196fdd8525637cfdb0970f042", "shape": [ 1 ] @@ -4244,7 +4258,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_0_self_attn_block_attn_w_k.packed_weight.u8.bin", - "sha256": "cbff1d78a3feeb67fca9095fea92fe40cc282a45776459fe82aa749922f4d620", + "sha256": "fb1445a194065f84f93d6fedd73113035d7beb2314d7cdf77a5731700c05ccde", "shape": [ 640, 160 @@ -4254,7 +4268,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_0_self_attn_block_attn_w_k.scale_values.f32.bin", - "sha256": "3209a3fdf503c3ccdd78d46a0013a46932396b116c08dd33d5458e5b3d8b7d46", + "sha256": "65dc763995a05d919bd32c3ae62429d6ae6e5dc59d7570e9e511e617400d105a", "shape": [ 1 ] @@ -4315,7 +4329,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_0_self_attn_block_attn_w_v.packed_weight.u8.bin", - "sha256": "ead4eb1e0d6c62532a7088f16445356b1c1674a11d19e0f2c5b5fe66f18188bc", + "sha256": "819396927e490b8c3959c6f006c112eb768d02d74b6b86b7afd8f7b372c1e2e8", "shape": [ 640, 160 @@ -4325,7 +4339,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_0_self_attn_block_attn_w_v.scale_values.f32.bin", - "sha256": "6c9df1445abe44f288e97f6233aab7f6bd2757d75bca91a527dab2c52b25e5cf", + "sha256": "258663b01b5d4aae55b2abc15b3e8e87db4a75c52f141f4ea132b1ed11ab0150", "shape": [ 1 ] @@ -4386,7 +4400,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_0_self_attn_block_attn_w_o.packed_weight.u8.bin", - "sha256": "b81593ee5f78bff319625a598ee3a326e450ccec286f4f054c41716a7a6c44fe", + "sha256": "e2f907585a66def6ac95c943ab6364491d9410323d6c2acf1e7d85f583b8cad6", "shape": [ 640, 160 @@ -4396,7 +4410,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_0_self_attn_block_attn_w_o.scale_values.f32.bin", - "sha256": "62d4c1ea8209bf8ef3c900abf620e9e98250331c70728a08ba701a897f680e97", + "sha256": "7c7233dbf0113e851ea6a854beae2f1c9ccf2871a1cc8798a07d00decccab7cf", "shape": [ 1 ] @@ -4457,7 +4471,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_0_cross_block_cross_w_q.packed_weight.u8.bin", - "sha256": "827dce8c453eafc2a1a5f73a75a2c6b7146b867b4c1e134609175df6cf4cf101", + "sha256": "97f87a393223a02090729500d41370d7d7d30a269b7710c919abfc48e7c008bf", "shape": [ 640, 160 @@ -4467,7 +4481,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_0_cross_block_cross_w_q.scale_values.f32.bin", - "sha256": "87ea67f73d751bedaa48a82d1ab55f6824ab8136e2e91b9d610662ca8601e763", + "sha256": "9b6668ebf77529a1006886dfc7dd0a74b54b295645cd3c7454c113143ca5a575", "shape": [ 1 ] @@ -4528,7 +4542,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_0_cross_block_cross_w_k.packed_weight.u8.bin", - "sha256": "3ec4ae80b24ffa71a637d7223b360d3928124c6487a2b9d714526456828930ae", + "sha256": "982b011fe87a1a8b0c2d5b4fcf645a9335e5e7e2e8a48b6983c879835a6aaa1c", "shape": [ 640, 160 @@ -4538,7 +4552,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_0_cross_block_cross_w_k.scale_values.f32.bin", - "sha256": "9f39d50bf53473b96c7d6b64d06d61e07fc684226defd840191874dea5bc6328", + "sha256": "1cd84c7bf5262b70b638f322e6ea50dd15a935a42c023048e208794f1e6efe8c", "shape": [ 1 ] @@ -4599,7 +4613,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_0_cross_block_cross_w_v.packed_weight.u8.bin", - "sha256": "73817a906cee71e8294c20ddada43956137ea65cb78d2d8eabcf7ac10e060a54", + "sha256": "1d14b3c5a2c23317ca7d3d144bad570d637b047b55b7a815621ab8fc8ec603db", "shape": [ 640, 160 @@ -4609,7 +4623,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_0_cross_block_cross_w_v.scale_values.f32.bin", - "sha256": "50c5f27dd38fad44d2d2ea50443fd9a6c50a187cbf389b3983179cc5f64d83bb", + "sha256": "e7afbeea361f30dea3b8b0647a08256bea9be60a1016f0efacb3af0316724247", "shape": [ 1 ] @@ -4670,7 +4684,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_0_cross_block_cross_w_o.packed_weight.u8.bin", - "sha256": "e23f5fa340d288f9a9df5e568a7cc5aab98df574c8e6961c2b5e0fc99874c4fe", + "sha256": "4c26e3f5b35f3698ba7cf07a90484d2898796924e1486ca1912fbe48eafe2766", "shape": [ 640, 160 @@ -4680,7 +4694,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_0_cross_block_cross_w_o.scale_values.f32.bin", - "sha256": "8298b5baf8f1af425aea4cb4f9587959d4f8c0027ff71e9681d9b99ac5908933", + "sha256": "71212803e1148c154056c46a4bbcbf62bf0924bbafaa98d757aac03cedfd9dd4", "shape": [ 1 ] @@ -4732,7 +4746,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_0_cross_block_mlp_w_in.bias.f32.bin", - "sha256": "00d2055f715b5ebf6759aa67eaa147307789564608619b6af16afe214fadd064", + "sha256": "243bc0ff5ab70374de5611e00f881f5e6ab2e37c01585d7cc91be33710e043e0", "shape": [ 4096 ] @@ -4750,7 +4764,7 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_0_cross_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "b2779b7294d7662e5869dfa1828bbd9ec56a99aa7f79f5242be287385aac92fa", + "sha256": "41c4fb217a184ad7c74cccb1850851c1fec8dcf6749702f45c6f886b31434c94", "shape": [ 4096, 160 @@ -4760,7 +4774,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_0_cross_block_mlp_w_in.scale_values.f32.bin", - "sha256": "8dfed15a2583ff098b973bd63595871e32e73b5601fd71c0a063349da4acb38a", + "sha256": "eaced36f128bb70455e0eb8d46b835775ac79a7e251254ebd2b0e6ec10378d0a", "shape": [ 1 ] @@ -4812,7 +4826,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_0_cross_block_mlp_w_out.bias.f32.bin", - "sha256": "3e8ff4ab3a6c857f9460c554109293ea056e061373af980590bddd5ee2abd964", + "sha256": "93e5d268cec594d48d9e4dba6f0ffbdec30bf60c8f72614448b97c57e8de9d02", "shape": [ 640 ] @@ -4840,7 +4854,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_0_cross_block_mlp_w_out.scale_values.f32.bin", - "sha256": "d289652991a8a6bbb6306b4ac100899fb2f35c3ad5beb337a41e9163b1979f7c", + "sha256": "c33677d40924532339ba17f96c7098ea6198b15280e68ed2ca8625912bd8aa8f", "shape": [ 1 ] @@ -4892,7 +4906,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_1_self_attn_block_mlp_w_in.bias.f32.bin", - "sha256": "b7bedecafd00ab28da70dd1d41a643953d459aec0d48a0def292a86285947cf3", + "sha256": "aaf15965a9a06378c7f852dd52d89df50e6d385e134adf4af02f7287574f160b", "shape": [ 4096 ] @@ -4910,7 +4924,7 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_1_self_attn_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "f9df04837ea94fe26b06971d5ea4373e2c1787e0454f1a07a40be4b7ed491d3e", + "sha256": "fa15212d02fd93611265b56ae98073e8df9c39fa11dd951d25dc73ae7c23161e", "shape": [ 4096, 160 @@ -4920,7 +4934,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_1_self_attn_block_mlp_w_in.scale_values.f32.bin", - "sha256": "a76081e216fbbc68d54fed9f36782cb1ec75e3c46c502d65335f13bde902ed9d", + "sha256": "25bc94907fcda7ecdceededafb999a692c98ec11cb650db24936e5ef633806ed", "shape": [ 1 ] @@ -4972,7 +4986,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_1_self_attn_block_mlp_w_out.bias.f32.bin", - "sha256": "c9d76e958c5d851419c40140a50474af301ead3f5a16f22c02d31e37c0ca631f", + "sha256": "97a5e1525e46a22cfc60a23ee4f5481ea11f3ca3ac5ea6f8a3ae7bdd90397012", "shape": [ 640 ] @@ -4990,7 +5004,7 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_1_self_attn_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "e05789409db540df482a00110f6eec694cdbbbef2c9793a1413be2828cce36c1", + "sha256": "c17f9cb3942097db7e1cc51d94d570e1c1a1a5fe31649a8d098362d756556f03", "shape": [ 640, 512 @@ -5000,7 +5014,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_1_self_attn_block_mlp_w_out.scale_values.f32.bin", - "sha256": "6fb8d80b3587c6f014292d592d6208d3bfea3f7b9cfb6fbd95b04abd470a30fb", + "sha256": "e771a85f2c8eda7bd2e67b1eb563931e0cf9ae4d9170d42412649041f6bc0ba3", "shape": [ 1 ] @@ -5061,7 +5075,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_1_self_attn_block_attn_w_q.packed_weight.u8.bin", - "sha256": "e51312cc484dfd598c10b167dbe6af940d013b5aa895d68abab0ab1ddd423d40", + "sha256": "bcaa3d82054320aee69a8fd250931d0f7769850b1b400d9cabbaa255363aa82c", "shape": [ 640, 160 @@ -5071,7 +5085,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_1_self_attn_block_attn_w_q.scale_values.f32.bin", - "sha256": "cee5a232daa2cac8d840a8a5d0710102daa58b71fc593bef0d596bdad06d3423", + "sha256": "ca2201ef58bdbde2cede29914dba3c64d4d39d0ebeff16d113af8159ac009a40", "shape": [ 1 ] @@ -5132,7 +5146,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_1_self_attn_block_attn_w_k.packed_weight.u8.bin", - "sha256": "48a1d4bb988a8c29875b8ab2d6c68b35b3d85ab70805536da149816d2d905533", + "sha256": "3c208fda9770ebca77af78e09a330a1fa8c11e9be00f68661e966a68a0ccd48b", "shape": [ 640, 160 @@ -5142,7 +5156,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_1_self_attn_block_attn_w_k.scale_values.f32.bin", - "sha256": "748fcc632ef97bc835054dad79fdd28617c717337ad6634c8739aa30ff8f9735", + "sha256": "858f9e7559d0bb7fa3898567404a3201cda67a783485e1a3396fdf3e3b795553", "shape": [ 1 ] @@ -5203,7 +5217,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_1_self_attn_block_attn_w_v.packed_weight.u8.bin", - "sha256": "3e474c856099c6bd35589e0f8b44adc02cf84b23065f9ba12ed2cde5cc9b8aa6", + "sha256": "03e84f866c79214ef48ef38da73e63d1be13e26bfab9d4650683bae5cce3a6be", "shape": [ 640, 160 @@ -5213,7 +5227,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_1_self_attn_block_attn_w_v.scale_values.f32.bin", - "sha256": "bfe670f9f0bc7d426d00b6397e8b6cf6845c80ca0de48bbe3a49a55ef9f36b64", + "sha256": "e3b03dfeea5a4d388630b3b2851b6108a4ca1a1c79c79840fc0c581906782179", "shape": [ 1 ] @@ -5274,7 +5288,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_1_self_attn_block_attn_w_o.packed_weight.u8.bin", - "sha256": "ff3d352a5e8801005b686799c2b163747ac4a997932bbb835a0d495015e8f37d", + "sha256": "8130120224c1be33e2655bb591eaadccbb788a00d7394160ecbeb705144a92e6", "shape": [ 640, 160 @@ -5284,7 +5298,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_1_self_attn_block_attn_w_o.scale_values.f32.bin", - "sha256": "5f5e4618fdc385f02530541d266b2e95d8432cae68eee49ba7284194bae2b6f5", + "sha256": "4c16a2df92ac54a79278c22bc3b52537301a6420a746ce41f227ca99620c8ff9", "shape": [ 1 ] @@ -5345,7 +5359,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_1_cross_block_cross_w_q.packed_weight.u8.bin", - "sha256": "c76b3bab12b71b791c49f31aa6822de42d602be8c2bf08d50435ec40616d3135", + "sha256": "2a17cca01d8239ae17510fc30457db79478b8cdc21c4b87664d82d542a68d00c", "shape": [ 640, 160 @@ -5355,7 +5369,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_1_cross_block_cross_w_q.scale_values.f32.bin", - "sha256": "137fa14f376bcba4bd21d5e2041af7e66bcef81930584cb571482bdd9fddc088", + "sha256": "b28cbb207d7fd7186365278550c51df45cffb220560a46ee104e47df984ae3c0", "shape": [ 1 ] @@ -5416,7 +5430,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_1_cross_block_cross_w_k.packed_weight.u8.bin", - "sha256": "577097cdab5aee51810dfebfa3223a3fa586ac82e08e10c817e7bb88823e6dc4", + "sha256": "8f097d5ab440b0ba3008ce087a47bd350198dc277b19a0b82252902b4c6d16cd", "shape": [ 640, 160 @@ -5426,7 +5440,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_1_cross_block_cross_w_k.scale_values.f32.bin", - "sha256": "194e3450e17003176706c9ed62806647d70744c5d5aece49e0a1932dbb65252f", + "sha256": "6f9f17178c426f37dc84f6ff8c32e58375782addb3e49d98e967be1c9a4a8e6c", "shape": [ 1 ] @@ -5487,7 +5501,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_1_cross_block_cross_w_v.packed_weight.u8.bin", - "sha256": "b409802e35ff1ea6ed39862aff9c220ca09e151a418b8cc3d528d12d70094592", + "sha256": "471b4a37f66a8b5583d41e02415a96aedd833d2b0b47bdec1aa8e897b2f32c78", "shape": [ 640, 160 @@ -5497,7 +5511,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_1_cross_block_cross_w_v.scale_values.f32.bin", - "sha256": "4f3a918598b8fd86ea2a2e2f55ab20ab0e72a2892c37e58bd7da0fcf41b6053b", + "sha256": "05a4de10024706188b2d5a60c71bf4e46da2d0a07a6d4703476f56829484beb0", "shape": [ 1 ] @@ -5558,7 +5572,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_1_cross_block_cross_w_o.packed_weight.u8.bin", - "sha256": "1647314ef6712e6dd39f2e63744b7431135dc2cceabb571950ee0769cee130b0", + "sha256": "e8466a50a9fc2ca4de15274be6b1c5339c6e0c1a3570289a576c7f4c0047d473", "shape": [ 640, 160 @@ -5568,7 +5582,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_1_cross_block_cross_w_o.scale_values.f32.bin", - "sha256": "57ddc9a933fecf788a1f0dd300a50b455b3698333e3e85b63332f05b9733aa95", + "sha256": "12c229bea058156dee5ebab47b585922cf4969e8cd9f86181894cf04514b2f4b", "shape": [ 1 ] @@ -5620,7 +5634,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_1_cross_block_mlp_w_in.bias.f32.bin", - "sha256": "e6525df753e51d34970abaf8d1c40a74b796720c1db712b744e7388fef61e8d7", + "sha256": "907a4a6d6fdb011b6dd5d94b2348e9e192bd9da2dec954ff781d0a1bef671b73", "shape": [ 4096 ] @@ -5638,7 +5652,7 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_1_cross_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "03f29751328c92fab31ad224f385b4be3af4d66bb7bbedc46123ada15d895825", + "sha256": "94ae5ae2753c38bf39ec63d701e65936a38bf557c6fe84fe8dff364884040e4d", "shape": [ 4096, 160 @@ -5648,7 +5662,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_1_cross_block_mlp_w_in.scale_values.f32.bin", - "sha256": "0168260e9d02616ac57d771b85b06f96d3c8ca0b1801b4d8f422d715f32267ec", + "sha256": "30d23be49820704681a3c9e803812639359b86604eb64e30a85bb2db26f71580", "shape": [ 1 ] @@ -5700,7 +5714,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_1_cross_block_mlp_w_out.bias.f32.bin", - "sha256": "779ad3d61df709063c357c15661555fb95c87cec16cdc5e9d9a4be9e4ec5cce4", + "sha256": "b2d3870652a5e125759e95b9f86733e0bc5f77d3f6a5cc411bcaa3fa566f3f0c", "shape": [ 640 ] @@ -5718,7 +5732,7 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_1_cross_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "d4a9f2dfebe2c7cc447debb622c90c0cb36b63148a2634d34e0d6fbdd0112e3d", + "sha256": "a83bfd0b689cf348764bc0360cf4408087f5fd10d81d8ba0df42986478fbfd59", "shape": [ 640, 512 @@ -5728,7 +5742,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_1_cross_block_mlp_w_out.scale_values.f32.bin", - "sha256": "1927215e4fa03d29dce248987860d1bfd75b9564af190b51e15e766bfab1d921", + "sha256": "16271011077b123cf1c809483461077673a1b0ea531b4b1c7e3279a9ecbeaa4e", "shape": [ 1 ] @@ -5780,7 +5794,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_2_self_attn_block_mlp_w_in.bias.f32.bin", - "sha256": "a05fd796bfabbcd856a02eecbdf1c61615fc0bae9bb77141dd55c871d87b4fde", + "sha256": "a9f6b4f1fe22589729eb0d737601b23ba4cc9ebfeadd09523d1ae79d52f3907f", "shape": [ 4096 ] @@ -5798,7 +5812,7 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_2_self_attn_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "254e4df1cacb8057dd692874312ddae05e490c57b26ad1b9ed7e5b402bb7c104", + "sha256": "3aa11246c81fd0bcac67c5f26df2ce838eaa6770c6e8b188a2b1efdeb7e9407f", "shape": [ 4096, 160 @@ -5808,7 +5822,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_2_self_attn_block_mlp_w_in.scale_values.f32.bin", - "sha256": "d140fa74601073ef9acb4600f6f1bfb6110f72c6d7e082beb6820f0252555a3e", + "sha256": "3281853fb7157f4e1e939dccb4fb652dde048d34458a09602421121869212659", "shape": [ 1 ] @@ -5860,7 +5874,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_2_self_attn_block_mlp_w_out.bias.f32.bin", - "sha256": "c13837272232ed41d7e260f3b31b5626618b8c3d9acc6ad54b63809998ead325", + "sha256": "57e85c9d9fa797c785031a5297b55baa622fe733fc2cad745c4def4220e6de49", "shape": [ 640 ] @@ -5878,7 +5892,7 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_2_self_attn_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "72ebd4c2d0042090da61dfe3a7ac97a48f195e2ca73e15a689d0457aa10c4f9e", + "sha256": "08c636f9bcfbb566fc98cf944f6410f7d07308c6885130104ba21b645b54229c", "shape": [ 640, 512 @@ -5888,7 +5902,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_2_self_attn_block_mlp_w_out.scale_values.f32.bin", - "sha256": "fbf47255266bc2a81a08229c4b3ccfa1469ad237636bb161483e3b2d7fb86be9", + "sha256": "93c67e503abfa2b964d6fd04f0da9d415189c99c05d16fd58a003a8819559cff", "shape": [ 1 ] @@ -5949,7 +5963,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_2_self_attn_block_attn_w_q.packed_weight.u8.bin", - "sha256": "fc2b4a3dda7010193c94d86591e64dc466d629981abb4e008ad60822c1b0c5eb", + "sha256": "a46c45fa4b4aa8fa996feae44e7be7d8820867af2449e0104f53fa6775179fb1", "shape": [ 640, 160 @@ -5959,7 +5973,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_2_self_attn_block_attn_w_q.scale_values.f32.bin", - "sha256": "594e276d9d79525ee1e48c2a8fdcd54499ef35e7722735cb1f996b273ca43e18", + "sha256": "08ad6327be95f2e8252c0521cc183e9262c5ca80beaa6d34484189cd74f5301d", "shape": [ 1 ] @@ -6020,7 +6034,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_2_self_attn_block_attn_w_k.packed_weight.u8.bin", - "sha256": "12099b3ddd6bdaa49ad496020dc79416d2cb6e18f19704bb554190d434ab7155", + "sha256": "71837c8df53923a1eb51839206bc2964dbb5931829c8bcaeda9baf89b1fd222f", "shape": [ 640, 160 @@ -6030,7 +6044,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_2_self_attn_block_attn_w_k.scale_values.f32.bin", - "sha256": "18cb18c1ca9df4ce1418ee60984e026d87470bff9d8f4f76327a33de17ed4361", + "sha256": "c0ee0049491ee814569ee869d71112df87a78155b57e8128d03d2bdacf4025ea", "shape": [ 1 ] @@ -6091,7 +6105,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_2_self_attn_block_attn_w_v.packed_weight.u8.bin", - "sha256": "ac7a8ee517ee14bd8fea44595f29da3148dc5d16b75cd861672c763e16ef453e", + "sha256": "9418c8f820fe57f66a6d297cf58d1d7145ee125e5fed29cad668c4013b55b5c2", "shape": [ 640, 160 @@ -6101,7 +6115,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_2_self_attn_block_attn_w_v.scale_values.f32.bin", - "sha256": "d5694a3a00c63856aa4ebaa5123cfa03ea6aa2f9e43b376846a07a55bddf367f", + "sha256": "c006a324dff21858853c4e4aea09fee0a0ce2f52a39ad72e78e7390a5245970c", "shape": [ 1 ] @@ -6162,7 +6176,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_2_self_attn_block_attn_w_o.packed_weight.u8.bin", - "sha256": "0db7a1ab2c75031956cb3abe22317c64ef8e11fe66ceac512bddcb13d8d23380", + "sha256": "16b3aaee9a4357d85e3911304dba4b92f256eb99648014896c74b67f15a881d4", "shape": [ 640, 160 @@ -6172,7 +6186,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_2_self_attn_block_attn_w_o.scale_values.f32.bin", - "sha256": "ff4979e14dfd682175f59a47aabac427a7975f5a4fc223fa72b96cea3c229f8d", + "sha256": "60debbe37b6fade7faf5609fbb09417ac8d679f41834db5f00e7c07f39005e8e", "shape": [ 1 ] @@ -6233,7 +6247,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_2_cross_block_cross_w_q.packed_weight.u8.bin", - "sha256": "e128832a8ecf3aeed808b74d87dad67cd255c2db6a17b162eca7d3127493bf19", + "sha256": "b80420f9122112b055341b9e6744e99760716a5b5ab9a8d2b616a6677fe6e51f", "shape": [ 640, 160 @@ -6243,7 +6257,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_2_cross_block_cross_w_q.scale_values.f32.bin", - "sha256": "b0e4dcd00804a2f10d5bdd9ef2e26c9827cfa86e628e4a749b1220ff0b323613", + "sha256": "f1cedf6bc25edc3a71af61cce2e793f02054ee85707373183901a6d7bfd9bc02", "shape": [ 1 ] @@ -6304,7 +6318,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_2_cross_block_cross_w_k.packed_weight.u8.bin", - "sha256": "7163115bc71e1a6087c257f47f457a601f61df0d0a68ae7ddf510c2bd610247f", + "sha256": "df6b0c4a3539a35bc6bf6a933fdc949458d51ef7c699f56da3b7d39a7298c735", "shape": [ 640, 160 @@ -6314,7 +6328,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_2_cross_block_cross_w_k.scale_values.f32.bin", - "sha256": "22b15efaa6bed88b4dff49d05a51ffefdd2c7ef81ccc4791b41ea5f4c93e0fbb", + "sha256": "fab7acdb1c2d26fec9ed3d0d00cb625d1d47f26530f0526554fbe35d12409b1f", "shape": [ 1 ] @@ -6375,7 +6389,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_2_cross_block_cross_w_v.packed_weight.u8.bin", - "sha256": "523d4f77f2c9a7c743935466c972cc168287e14dece99d40238b346fb27f97fb", + "sha256": "1a2cbf704f1f495d86f0dcee2ff15a889756988f9ae0ac8b74545dd27c9def2b", "shape": [ 640, 160 @@ -6385,7 +6399,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_2_cross_block_cross_w_v.scale_values.f32.bin", - "sha256": "9b9fc9730e2c668496ece1d4a5de9763bc44f2671b241a1c1debbb5ced26bcc5", + "sha256": "df1ad53be309ab52d1870c805583bc8f1f5747febc64464a8ce2d871b91c11a9", "shape": [ 1 ] @@ -6446,7 +6460,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_2_cross_block_cross_w_o.packed_weight.u8.bin", - "sha256": "4132a59d48ec7d51ac30c3f4175f57e889599efd7e625c797cbb8b5d831e93a6", + "sha256": "48b06288bc81900b14715d87718e8eeda0c60aad102b2c506db1f60e30426d25", "shape": [ 640, 160 @@ -6456,7 +6470,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_2_cross_block_cross_w_o.scale_values.f32.bin", - "sha256": "6a6e109563dbf7d40b494d34532e95a304b0eeaaa2eac805d391b0223af6dc77", + "sha256": "6b8105fa87a0c153c3b85b143ddc7d8345e3f5e7b00609d57ecf05ccb37e75bd", "shape": [ 1 ] @@ -6508,7 +6522,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_2_cross_block_mlp_w_in.bias.f32.bin", - "sha256": "fa1ba39d161738e5813daf52c5771c4b342fbb0cff72e6f002a4ee2ced15f2a5", + "sha256": "62ee98df5599d0fef4c7e56e802677f5db362fe0f3fb1940c7b073a24ef84a15", "shape": [ 4096 ] @@ -6526,7 +6540,7 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_2_cross_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "84689b32bc8ca799f9dbec89a8007bf21afbbe8112aea203cb54ef49cd0fd741", + "sha256": "6791d3fd41589fab3eda4e56c8537e654686e8a90dbec04bc4f5dca84b23220d", "shape": [ 4096, 160 @@ -6536,7 +6550,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_2_cross_block_mlp_w_in.scale_values.f32.bin", - "sha256": "d2f1117c13f4e19bfe03e087a9701a252e538ae56a8b1ee89e39086101359b27", + "sha256": "d3e6af24929fb6449c2a8510f5ce57d515629a5fa3996f6fc96993a698a8a337", "shape": [ 1 ] @@ -6588,7 +6602,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_2_cross_block_mlp_w_out.bias.f32.bin", - "sha256": "a1c186530cec1e3ef538bf7a766cbc32991dddf87af3906987f90cfb231bb7d3", + "sha256": "a98d0431811d1f5bf2c1ebf562d91f3ce65d75d64520575efcfcab46e018b2e4", "shape": [ 640 ] @@ -6606,7 +6620,7 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_2_cross_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "243056cfc23ab07879aed6d68e44c4a03bce85cd1d33916cbddd05d3ad558647", + "sha256": "71cab0c976abb9f5a8f17da4cf8460f356e31729d1e0593a2e5aa88e41a458f6", "shape": [ 640, 512 @@ -6616,7 +6630,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_2_cross_block_mlp_w_out.scale_values.f32.bin", - "sha256": "23fa500a5c1d7fe55f6d2e59c571d48b88c9dec6c1efe09f3f3f4cffc4d0adbb", + "sha256": "2795d779ab9f77b8fdf7d144a1d92a34d68a4af9dbdd2f7594fdcfecde3abadf", "shape": [ 1 ] @@ -6668,7 +6682,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_3_self_attn_block_mlp_w_in.bias.f32.bin", - "sha256": "760c1ece295a8913e80f14927e266520a947959aedcfb2c38b58af2f920b2f5e", + "sha256": "8698835f3c913ac1a26c481cbb8bfd690bdfce971922e3d7d541a6d7099e3977", "shape": [ 4096 ] @@ -6686,7 +6700,7 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_3_self_attn_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "4d52aa7e8602cf434845d833c7814f3d81462b12497e429b61418c0b81b39959", + "sha256": "375345d99dc960f212fcc7ab73fe74e618167f4bacb0e34b3d5fd75682efa4a9", "shape": [ 4096, 160 @@ -6696,7 +6710,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_3_self_attn_block_mlp_w_in.scale_values.f32.bin", - "sha256": "f7a83807f3dc29cf15f6cc3e6dd2c883491029cd88085c34661ae464a2d7c2b4", + "sha256": "a93671fb72d1708202ce8296acc051d8cb6e1161c733425448bf66fea20c1115", "shape": [ 1 ] @@ -6748,7 +6762,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_3_self_attn_block_mlp_w_out.bias.f32.bin", - "sha256": "43f6f98654b26b0732dcf104df7c540836aad931c7878b05640d7fba87a90d9d", + "sha256": "815889ff5b4eb207d60345cf0edaa41e14ef55598c0c6f30289543589cad84fc", "shape": [ 640 ] @@ -6766,7 +6780,7 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_3_self_attn_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "607fbcf1a60bcbf4076552c0c51cff2853cf36d2f2b7a6fb02f8624033486b76", + "sha256": "2424b38121121a0387b71c91d153ba9debb8aa9fb2737ed1221c2606888475b6", "shape": [ 640, 512 @@ -6776,7 +6790,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_3_self_attn_block_mlp_w_out.scale_values.f32.bin", - "sha256": "b86ac13eba188e7744a8064948b792bbcbe74baeeb602cc6d1cdef84bad3b00e", + "sha256": "a104324e1e7cc41a3f01509e6e8ced8e762acef0fabac4544ffb92b443d73019", "shape": [ 1 ] @@ -6837,7 +6851,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_3_self_attn_block_attn_w_q.packed_weight.u8.bin", - "sha256": "46638b7393c85823b8c15351aa8b337ad6b0ef45d4580ed4d6ed039a056e87db", + "sha256": "5a8b72acd19e793b8c0299c75b992f12f268403a9cd011d6514aff9d3232dc1a", "shape": [ 640, 160 @@ -6847,7 +6861,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_3_self_attn_block_attn_w_q.scale_values.f32.bin", - "sha256": "200b76613bfdbe2a0254ef01611444ec15f9de52fb50f81dab3d273b4b96da62", + "sha256": "f0b2ad4c13d7c55058e593fe97242797f9c3bf699d4b4382a1bf45cab3145f3e", "shape": [ 1 ] @@ -6908,7 +6922,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_3_self_attn_block_attn_w_k.packed_weight.u8.bin", - "sha256": "af216fdafa01c70a3c29f06a2cd89ca7548588df5005f64d722a063e9df46dfe", + "sha256": "d8566006b654e57a85cf7e668d23eb6a8b00bbea8c920c5e3004bac61d165902", "shape": [ 640, 160 @@ -6918,7 +6932,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_3_self_attn_block_attn_w_k.scale_values.f32.bin", - "sha256": "040b7bfe0dda2f2e3885d8ac903ede97b7c5c54ff3a60faa0e7b2f8ea1b24eae", + "sha256": "92d66a55428f7813a0c25bf7ea743cd5fefba17398bd3cded05ceeb46fc4e665", "shape": [ 1 ] @@ -6979,7 +6993,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_3_self_attn_block_attn_w_v.packed_weight.u8.bin", - "sha256": "74a9caf4caf5cf52645f81f8b0fc823e42084f822da768e2614e6066fb892581", + "sha256": "db853386ca2135aeb2a21e4811a96f6a7f5e38ecc356057cd61826dc281c9a1f", "shape": [ 640, 160 @@ -6989,7 +7003,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_3_self_attn_block_attn_w_v.scale_values.f32.bin", - "sha256": "6bdc606c42114297c497963ca58b5bb3be4ec11ab89424a9a1d19ecd9fbb84a0", + "sha256": "01159e95ff778abe2236d0492dfca3d20d14a6b3848f0583586174cbda64aaee", "shape": [ 1 ] @@ -7050,7 +7064,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_3_self_attn_block_attn_w_o.packed_weight.u8.bin", - "sha256": "00e16ff3ecda8c9f89eeeee4f1271e9f7b7807571970e15c2070acd6c7a36190", + "sha256": "56465616cc74db684e4cf91b6a4eaedf20d2dc0fce3d52e80188ad2ff4b17bde", "shape": [ 640, 160 @@ -7060,7 +7074,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_3_self_attn_block_attn_w_o.scale_values.f32.bin", - "sha256": "03a834edef6a098c2fca9315a4167ca1be9634782657a9909fa48bf313711a04", + "sha256": "64be926fb8e3f7186096dfc7d71be5ef1c3adc4b3ca4cac933399f06ca4128ef", "shape": [ 1 ] @@ -7121,7 +7135,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_3_cross_block_cross_w_q.packed_weight.u8.bin", - "sha256": "8f97698724d741ad7f51f5dba3d951f331ad800efc11f922b102865baffabdd1", + "sha256": "11cbf72fee9113e4c199fabd74ed6b5292b90eaee86b44c1adccae8ccd942783", "shape": [ 640, 160 @@ -7131,7 +7145,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_3_cross_block_cross_w_q.scale_values.f32.bin", - "sha256": "a2632ea079b5113f382e81cf1782633e02e9b4ed1146c56b171d669602897ad3", + "sha256": "6e0380b2fb97251dc52cde6bad28c297473604cc977a027621c9baf7240444c0", "shape": [ 1 ] @@ -7192,7 +7206,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_3_cross_block_cross_w_k.packed_weight.u8.bin", - "sha256": "477aaa3e3dd636d2a857add391fc8a3a2f4fd26fcbf30b3cf95438cbd590737e", + "sha256": "0935f374bd55ada307174506bc24bd4291f5c72db145af937ecd472267d646ba", "shape": [ 640, 160 @@ -7202,7 +7216,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_3_cross_block_cross_w_k.scale_values.f32.bin", - "sha256": "92e371e8f1578aff6796f3ac4975c287e5d63174323035efffc1c931fce54f2c", + "sha256": "87b6ef8c6d77f5a498047d9a58ee6fc5e3296b67a4909aff8735fbb783a18b0b", "shape": [ 1 ] @@ -7263,7 +7277,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_3_cross_block_cross_w_v.packed_weight.u8.bin", - "sha256": "0acd96871682cabaeda0c52a369e3320c4fa2267f2447df644f5ddfa00807a9a", + "sha256": "1a2937c81a609059d506dc0346018eaee4ea694d4ec4a28ea2f216cbf9fce034", "shape": [ 640, 160 @@ -7273,7 +7287,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_3_cross_block_cross_w_v.scale_values.f32.bin", - "sha256": "a2e18e9c82d54908c20217100cc44da0690dc7d126e8ccaff3d55221cceea5e1", + "sha256": "0faeb054329b75c4b46fff740fb9bff988744aaf029feb19b27698d926185604", "shape": [ 1 ] @@ -7334,7 +7348,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_3_cross_block_cross_w_o.packed_weight.u8.bin", - "sha256": "10dfd78a5e363fb05309f0fa3ca5a8fa688683439e799e2bf5190fad839f07d8", + "sha256": "e6adc5855efc0bb782aed30cbe0c6a1b2f8c80608739c6c88fdc871a8499737d", "shape": [ 640, 160 @@ -7344,7 +7358,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_3_cross_block_cross_w_o.scale_values.f32.bin", - "sha256": "6d5cc8f071d2dc9ffe100d11d0b9f805a71ec3f0e1dbe74a4e28ff79176faca0", + "sha256": "ff846e9985573ecd305b77a54a7e988d2144dc5adf9a6916813d435e9ab561cb", "shape": [ 1 ] @@ -7396,7 +7410,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_3_cross_block_mlp_w_in.bias.f32.bin", - "sha256": "b55b6b210e332ecf839d8e181f76fd76be84b835972c103009c2b8f42b105017", + "sha256": "e849a329a8fad72a3c78519452879346d4610159c55ba54cfcb9b781f97cb30e", "shape": [ 4096 ] @@ -7414,7 +7428,7 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_3_cross_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "61423b913e96c820c10dc2a26cd5c4de3e998b1b04dcf2fd4a41aed1e738cf7f", + "sha256": "b42b255a137c29ef6f63d5c24a0fc97de401b6f9b34d30df779ba7118912e2e0", "shape": [ 4096, 160 @@ -7424,7 +7438,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_3_cross_block_mlp_w_in.scale_values.f32.bin", - "sha256": "08f0a86a075e56691e5f5e3bd404c005147007c9b6b0571b8bc8c07737aa3d67", + "sha256": "c7b72990e8b2ec40c9892aba65b9cac0622cbc6ac1ad1963be6f12c45530c560", "shape": [ 1 ] @@ -7476,7 +7490,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_3_cross_block_mlp_w_out.bias.f32.bin", - "sha256": "9f1b6d2c15741c6eab8cfacdac19bc54f431fd2432c2f39afa48b6058f1f343e", + "sha256": "2c675afd5742963783bf330d279082e56a8b5538a9939e168179c89fee8da7fa", "shape": [ 640 ] @@ -7494,7 +7508,7 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_3_cross_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "b695846f6c7cd7fffbb50080475d1b2f18cf5312be049cc47802b9bbb23aa497", + "sha256": "ef232657569eff68765131f1f78eeabb02eb1775709955e07c99ba4440570bd3", "shape": [ 640, 512 @@ -7504,7 +7518,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_3_cross_block_mlp_w_out.scale_values.f32.bin", - "sha256": "91fc9753ecb2e9d8f4e37de4aff3cf86d17969af54f6200871685ec677ed1ba2", + "sha256": "00ff62715519571ab08949ecbbb673535a3671d32b1a9eed572e5bbe7aad8b7d", "shape": [ 1 ] @@ -7556,7 +7570,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_4_self_attn_block_mlp_w_in.bias.f32.bin", - "sha256": "e836b2102f7f826f339bc7b014e07782d3a748c773f10ba3b01b940d29b44182", + "sha256": "58cb7e7aec507f1957187d6fed32241c60b2b5d26382faf9ae0a6bb6107ca974", "shape": [ 4096 ] @@ -7574,7 +7588,7 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_4_self_attn_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "ee9a82a04d0e4459c4cb7f94c28d2686ddae16e6668738edfa76cd8a013666ae", + "sha256": "870916449e436f9e60f60ea3e12f3435e863dbc0becf7b04705ce6f03206a44d", "shape": [ 4096, 160 @@ -7584,7 +7598,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_4_self_attn_block_mlp_w_in.scale_values.f32.bin", - "sha256": "65639fae837d12338698909216342b9da9ebbc2c75d3058b73fe5b3d8e342350", + "sha256": "2e4e7df77ff5c2e5cf71328c80f8ec401a6f624e683790badd0b7aae32da3c2f", "shape": [ 1 ] @@ -7636,7 +7650,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_4_self_attn_block_mlp_w_out.bias.f32.bin", - "sha256": "ce15af4c19781b8525971868cc9fb94e220f1867242fa7faa61242529661471e", + "sha256": "e39e3873069fd6a675cfc178936887e12f6aa51d658b846ba25a978b9cabf735", "shape": [ 640 ] @@ -7654,7 +7668,7 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_4_self_attn_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "6aa023b652ea8cb4c15cda43b758697397951ca79dfef5767f4bd1e0da99ecdc", + "sha256": "0d20e20a86bc772bda2b92d98747d3711be44c4d86cbca7c3984026cb346dbc6", "shape": [ 640, 512 @@ -7664,7 +7678,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_4_self_attn_block_mlp_w_out.scale_values.f32.bin", - "sha256": "20b79d91f90bd50129605b252e0a23dcb120666afac4e988e997b4cd6496a4d1", + "sha256": "91a69820c780a5812087ade3eee56f8fa3fd4ecb49c52fbc788ebf537cd87df8", "shape": [ 1 ] @@ -7725,7 +7739,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_4_self_attn_block_attn_w_q.packed_weight.u8.bin", - "sha256": "b6abce78b00434b9b260f5dc37b7b7367830778dbceebd3a9d6f8527f9c99d86", + "sha256": "45826f137d54cbb649e5c6ae6dea1810936c192577dad65f1e7a847984a81004", "shape": [ 640, 160 @@ -7735,7 +7749,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_4_self_attn_block_attn_w_q.scale_values.f32.bin", - "sha256": "666df0214bb1e28eb5f382b2b12181fcdf9befbac704d819b8c60fd9afa91a1a", + "sha256": "33bccb48e0d40c9dc8eb90a23cd8c427e7824f1c930fe20d90589cda3f5bb030", "shape": [ 1 ] @@ -7796,7 +7810,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_4_self_attn_block_attn_w_k.packed_weight.u8.bin", - "sha256": "1a6452884ccdc02ec802da82f200c4a80aa1e2b090849decc9b51230e621e812", + "sha256": "e300586d5091990a15d12e681e43cfa4a00af31f8a6f886e446f770e7c554271", "shape": [ 640, 160 @@ -7806,7 +7820,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_4_self_attn_block_attn_w_k.scale_values.f32.bin", - "sha256": "f3d67151d91e46353e8674137bdfcd58cc7c68ba8effcf87a6d0e4539183dd63", + "sha256": "b27f63a35dc17e8b23a4dbe85408fd3350d5083c9c8312fd18ff16345eac0a84", "shape": [ 1 ] @@ -7867,7 +7881,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_4_self_attn_block_attn_w_v.packed_weight.u8.bin", - "sha256": "be998d5ab45cd4790a8c69a33479b59f65f938618ab7e8fbd56a7b19ff9abfad", + "sha256": "8331e844e9535e0c325edd19e161c13edde32ae663380da09025993cdea60422", "shape": [ 640, 160 @@ -7877,7 +7891,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_4_self_attn_block_attn_w_v.scale_values.f32.bin", - "sha256": "4f5578ec265f37dc898731cb72c748c24e3e480a64d5788c1815617687d3fb24", + "sha256": "2d4fb5a2384b1b4bb2f482db3ec538d363a09e046dbd54e882bf784c6a5c08f4", "shape": [ 1 ] @@ -7938,7 +7952,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_4_self_attn_block_attn_w_o.packed_weight.u8.bin", - "sha256": "abac573fcfcb72212c55adb43bc1db1967e7e78a374ec940eb6c4f5d635ea06d", + "sha256": "5373c29c4a939b97eeb54207b6c441a0fead033399cb00e36beea3dbf941bac2", "shape": [ 640, 160 @@ -7948,7 +7962,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_4_self_attn_block_attn_w_o.scale_values.f32.bin", - "sha256": "c6799bb383071e94dfadf6573f0416870ef323ebeb31e87626ed137e44c98c6c", + "sha256": "3d1728382c159072d32f88230a61708e950d6ff133929cd12dea8121d83071c9", "shape": [ 1 ] @@ -8009,7 +8023,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_4_cross_block_cross_w_q.packed_weight.u8.bin", - "sha256": "bfd163ff0dcad21ccd7fefa73fbf79ac9053c709a5717e10f75b6fb936dc8c6c", + "sha256": "f89dfef1e375b5f6cddb72810c8f43663550c1f6617a0689ebfb9ac9d71d6ce2", "shape": [ 640, 160 @@ -8019,7 +8033,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_4_cross_block_cross_w_q.scale_values.f32.bin", - "sha256": "7f4810a434b0a8dabbb5eae5b0fd327442680722039f8645b6bc00ffe3654ce1", + "sha256": "86b0c2ce4ea6968b0d5bfe161ff5172eccd9b6ebc1a81202bd03f0d21394be60", "shape": [ 1 ] @@ -8080,7 +8094,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_4_cross_block_cross_w_k.packed_weight.u8.bin", - "sha256": "c42933ccb66f22357bb4e6d65e94956b9d818f192296b939f38847111fc520f0", + "sha256": "0ce39dd91774074736c5720d2ef64ecab695ad08f57343d5e2c97b11448dcf18", "shape": [ 640, 160 @@ -8090,7 +8104,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_4_cross_block_cross_w_k.scale_values.f32.bin", - "sha256": "a0bc89dcf0a96b2ae6f6f5c25823f4bff2d2a01eebf4532f8aa65c79c4643bec", + "sha256": "a1f0f48bb45d012edba1ff192711ef50e47cf6a92a0385bc9e319e3f2478476c", "shape": [ 1 ] @@ -8151,7 +8165,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_4_cross_block_cross_w_v.packed_weight.u8.bin", - "sha256": "566aef9b1805aaa57df77ebf90224e82bd2ff3d6a815249d03e5e11c5ed1c23d", + "sha256": "1a625004d390f89ba744f0e76c635ef5ed804ebe321d4468558a81037c02f97e", "shape": [ 640, 160 @@ -8161,7 +8175,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_4_cross_block_cross_w_v.scale_values.f32.bin", - "sha256": "9536ed49e49bbd570119049a0116e4d11b8198a1ba378c107175ee7333d72ac9", + "sha256": "9df9184076a41b00dcac5ab27177869f612ff7b7f6f9fa2e86940b111132a375", "shape": [ 1 ] @@ -8222,7 +8236,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_4_cross_block_cross_w_o.packed_weight.u8.bin", - "sha256": "018bbaadc1966a49cc913b807f3a54465c8a0a2a1f566e91a57c172a0624bb2d", + "sha256": "37f9d08deeb5da3fd5917e830b09280c2ef8698f513cb4fbd48d441278b63d4f", "shape": [ 640, 160 @@ -8232,7 +8246,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_4_cross_block_cross_w_o.scale_values.f32.bin", - "sha256": "8a67d2ef56ce256ac2ecfabc2f78e2c28089507c9715d21fce13153ea0a93cf8", + "sha256": "6d056c23594e9fda03e1f0045e7bb77bd977c7ad97ce3facd6079d7e21539692", "shape": [ 1 ] @@ -8284,7 +8298,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_4_cross_block_mlp_w_in.bias.f32.bin", - "sha256": "504553e77c868b26f1e9a3df5d802722876c10ed42a3022eba8fd37483108c12", + "sha256": "d15970cd583a238ef5df0cba7c57f0f0ccea9051feef6c83b10eee60a2ad92b1", "shape": [ 4096 ] @@ -8302,7 +8316,7 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_4_cross_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "0ee380e03abaa8eb75539e908a009a2c0fab2af231ebf9c77ccd8bea01625563", + "sha256": "a0489721b293b3ca1fcdf662c044237b0ae07aa9ae460fbd66d6e4d4edd68b50", "shape": [ 4096, 160 @@ -8312,7 +8326,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_4_cross_block_mlp_w_in.scale_values.f32.bin", - "sha256": "ca2393d1d6cfc924d3705620afae401da0a1057cb70a627a762862d880e4dc57", + "sha256": "a877c0e3d34e4de0a55784c90a53c41193d06d932cf356643e0c9c39bbd877d9", "shape": [ 1 ] @@ -8364,7 +8378,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_4_cross_block_mlp_w_out.bias.f32.bin", - "sha256": "7e2f8fa91fd415e7df8c55898beae2a32c79635c3f3e14d7f474dc27d7fe7e5e", + "sha256": "c4706434e5600143b8000b42086e5876cd70ee3f705c9b6f660650e61e6704e0", "shape": [ 640 ] @@ -8382,7 +8396,7 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_4_cross_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "6ac53ae9a8d1b549675b173632028543b73aee8bdeb52165739a5dfb8e01dcde", + "sha256": "f902606d6093a73f74866075bc990c9b1fa21f5ac3918d82d52531a6e6b27dd1", "shape": [ 640, 512 @@ -8392,7 +8406,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_4_cross_block_mlp_w_out.scale_values.f32.bin", - "sha256": "17a1ad12c4a297e3333fd1a00dc1afe0651cc68e2f927a9c92358990a400794a", + "sha256": "5ad60db274db1cfe4f344945fc6a354a9a75fb2666c99b8d13a85eee28be1b57", "shape": [ 1 ] @@ -8444,7 +8458,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_5_self_attn_block_mlp_w_in.bias.f32.bin", - "sha256": "7758b963a9e36525d1d6d49027aeab3647ca6c3b9a60dce81d38ac5cd041fbdb", + "sha256": "5fbdd191cb5c5b15dd436bb0eb61d75f4dd1ffcb139d867e7ec1362a6f698d78", "shape": [ 4096 ] @@ -8462,7 +8476,7 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_5_self_attn_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "ca50cff4086a68e7b381928637256fbafa7ab0b4d7e7db18c98ff7bd58424879", + "sha256": "324d5b0baa2bd143549f6b876e4847bfb14df87e6f4c5f2ed8c38f80f7a1bd60", "shape": [ 4096, 160 @@ -8472,7 +8486,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_5_self_attn_block_mlp_w_in.scale_values.f32.bin", - "sha256": "b34e67e0bd1804287bd6304f8909fbcabca41c8e33148de56b51cd82bab0de62", + "sha256": "a981bf8cfaae486dd857b1fc89be565b3858c02e7fd79d6213ff125ca715fe5b", "shape": [ 1 ] @@ -8524,7 +8538,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_5_self_attn_block_mlp_w_out.bias.f32.bin", - "sha256": "b280eafca25a670d2e9f3ea5fee996077207399ced3a43dab27b982a316bb5c3", + "sha256": "c8d46fdf1ddf2b1b8aaecabaa8e43068f74bb265db62ec27e7203ef055f8d3d3", "shape": [ 640 ] @@ -8542,7 +8556,7 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_5_self_attn_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "a1bb7afec833a278d841fef92fa2aa4144638247087fbcab89f9a664dbd16013", + "sha256": "d11e2e2807b998655988a6994f40b12f1147bfcb09e1d212a6ceddf86a8b9d70", "shape": [ 640, 512 @@ -8552,7 +8566,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_5_self_attn_block_mlp_w_out.scale_values.f32.bin", - "sha256": "92b557a7c755ee619d71c405bafc0e40db3d479fe5a6c9bdb7379d5f212e6904", + "sha256": "9d419ffd1604b3adb24e2f51c7707ad3bb3865beee1f25bf19e584c09768b3f9", "shape": [ 1 ] @@ -8613,7 +8627,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_5_self_attn_block_attn_w_q.packed_weight.u8.bin", - "sha256": "d15bdb5385f8931d59f913e96be21e5521149624139ef72e734f73d61af53c2f", + "sha256": "63ac0aaab6fe41d627f6cc07bb5e3441fe952761555f12f828a71b26612694b0", "shape": [ 640, 160 @@ -8623,7 +8637,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_5_self_attn_block_attn_w_q.scale_values.f32.bin", - "sha256": "0217589c56e8bb040880aa2ce7ebdc3ac5f250b12b8a11787a253143634b5bac", + "sha256": "3bacc7a7c0e98bfaaf14ba92c4287fdc929b5abc536607a4ac005d7f3c9fc06f", "shape": [ 1 ] @@ -8684,7 +8698,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_5_self_attn_block_attn_w_k.packed_weight.u8.bin", - "sha256": "168f0686219feabfd7985ae44027f4b62a75a7031d4795d7098ce9d02c251032", + "sha256": "bce33f116822eae9b8b4722529395182e463aad001e3a79d16808be7b00dbe19", "shape": [ 640, 160 @@ -8694,7 +8708,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_5_self_attn_block_attn_w_k.scale_values.f32.bin", - "sha256": "342fa912e6c7400ed8ea8b18c411f406a024ee0698026e1b25641814b7278261", + "sha256": "d803f9f462591e86f4ab0c448526fd033b3f461206d329cfeb14261ae12d77de", "shape": [ 1 ] @@ -8755,7 +8769,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_5_self_attn_block_attn_w_v.packed_weight.u8.bin", - "sha256": "d1ee78fe8bdf9a01d8f82e6a22aa1e182407d7d4670a87d5e21bf2a34fe442d3", + "sha256": "a3207da1809eaa7cd2cdb75e16ee500c93759b4dd5e45c39ca8f239312fb50c8", "shape": [ 640, 160 @@ -8765,7 +8779,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_5_self_attn_block_attn_w_v.scale_values.f32.bin", - "sha256": "e38daff351bac7c1f9b9a4f7295119cb303c7037e12027fb8a36effbdec8190d", + "sha256": "d6a96d8269d69aed28e0b1e4bac833243793b2979d819ea9e307efa2868925c7", "shape": [ 1 ] @@ -8826,7 +8840,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_5_self_attn_block_attn_w_o.packed_weight.u8.bin", - "sha256": "b22c7b2bcb868951760cab5ad05607942978b83f1f54e50269dd2a894b292ee4", + "sha256": "0bcad956e60d87582886abe3873b73c31c6421dccd07ee572bc3ebaef8b93c5f", "shape": [ 640, 160 @@ -8836,7 +8850,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_5_self_attn_block_attn_w_o.scale_values.f32.bin", - "sha256": "1cb27fec2c7867c8c1ebc9ae311f80dd146d9d35536fcf71fbb63e38a4fce3b4", + "sha256": "6558f786b4707e9a74cf3b309288f44bab2fe85d7c2bf63d8191ce5d7717523a", "shape": [ 1 ] @@ -8897,7 +8911,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_5_cross_block_cross_w_q.packed_weight.u8.bin", - "sha256": "210c10daa667e6479481d6d3ba2f0ef98b5a7e3f0bd9e853f61937c966a5663e", + "sha256": "0d27485165aa65ac9c0302c40afb801f24550eb5e02761361021024fa58aa45d", "shape": [ 640, 160 @@ -8907,7 +8921,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_5_cross_block_cross_w_q.scale_values.f32.bin", - "sha256": "63743e12bc6c750bb6ff44b421e2eb455acc1f894b52d27c31a9db927da15569", + "sha256": "d3aa0d2be93667164d611db40a95d945427af758e978c9f51df73d98e33a65ab", "shape": [ 1 ] @@ -8968,7 +8982,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_5_cross_block_cross_w_k.packed_weight.u8.bin", - "sha256": "2421fa0bcf4fb2ff3e2faf11d960666dba196f5265ac3c0c07205ec7e2188589", + "sha256": "f24322858b2d972eea75e282e3a7a48c77cbcad77e8bd6de7e01e15dedf32329", "shape": [ 640, 160 @@ -8978,7 +8992,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_5_cross_block_cross_w_k.scale_values.f32.bin", - "sha256": "a6e13b8b98f8f3a56588c424d0f0eeb2d97ee80fcdf8391d94e81fd0b041ea63", + "sha256": "6e9a8bfc36c2e35971e6976656299647b36e4a24e164890b98bcc4e70110e76d", "shape": [ 1 ] @@ -9039,7 +9053,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_5_cross_block_cross_w_v.packed_weight.u8.bin", - "sha256": "e99e62d118e9ee188448b44590afb392c48a14422a7087ebe14fad5f1ffcbbd4", + "sha256": "0252a685fc4582f57ae143d51ce3fb8973e098e24c9978a920e2d33fa4d59e98", "shape": [ 640, 160 @@ -9049,7 +9063,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_5_cross_block_cross_w_v.scale_values.f32.bin", - "sha256": "d031e5ab601acfeebe4a5f573155fd552b2f9ddd44bc9920b6748d3915704fd5", + "sha256": "cf740bd129cdac2d57821e98aa6b0589bf055d31c0b0e7a8ec7109191d803e08", "shape": [ 1 ] @@ -9110,7 +9124,7 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_5_cross_block_cross_w_o.packed_weight.u8.bin", - "sha256": "beab9c7f54cfb1f245c0860f6fe4a8e1cf07b68ccf2100119184d157905e6e0a", + "sha256": "8925a3109acfe4a65b89a643b38a980440ad8000565dbcd68fd8d9128091965a", "shape": [ 640, 160 @@ -9120,7 +9134,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_5_cross_block_cross_w_o.scale_values.f32.bin", - "sha256": "2b8adf007a2bddfd616002af4fddddac73e836196ce335a5fbae84bc40f3b7de", + "sha256": "6d7e412565361ac5fc632c4531b71b650dcc98ed6614078fb82db77a0fbaf7c7", "shape": [ 1 ] @@ -9172,7 +9186,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_5_cross_block_mlp_w_in.bias.f32.bin", - "sha256": "2f895fa89f658cf7074483d010ffe6c7e8fe79e24c939268b27b8ae0c5a38415", + "sha256": "178e819216d729a089888c37140a99b1337d1b8866b2ca2a3772bbfa80d8384d", "shape": [ 4096 ] @@ -9190,7 +9204,7 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_5_cross_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "41304fecf261465ff3847dbdee49472009d2a3262b8dbf7fecf31ad0854dc5b1", + "sha256": "1098e01a4c56b23c62db470d2def0e876e78074521a6f26fe101b323ef914b8c", "shape": [ 4096, 160 @@ -9200,7 +9214,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_5_cross_block_mlp_w_in.scale_values.f32.bin", - "sha256": "c347d522ec28f95a2e57dde268763d465598af66efe957ecd9250e87f8cd85a9", + "sha256": "689b925a8e9594e32ed35cca127e7146ab7c932b50f31091455c2ffef93ab574", "shape": [ 1 ] @@ -9252,7 +9266,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_5_cross_block_mlp_w_out.bias.f32.bin", - "sha256": "9bf3661e4bb1f05bb419ff26865cda4d421d7abd79d47205791194e1807ef461", + "sha256": "05d28eff762fb39a07cb0f87dc407b08eb966482efca2d63556b1803eacfd613", "shape": [ 640 ] @@ -9270,7 +9284,7 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_5_cross_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "90ae1df6b88f5d3a90f4c345eb78be91c4aa0879c80360b5c3da63ac2f2ea568", + "sha256": "02b49be34e4473aaa3a36f63004abd08395cdfa30c78f79f1aa8ecad314f6e3c", "shape": [ 640, 512 @@ -9280,7 +9294,7 @@ "bytes": 4, "dtype": "float32", "path": "decoder_5_cross_block_mlp_w_out.scale_values.f32.bin", - "sha256": "c0ee1efb333a2d1fffc03499ffd31475c523a2f72a1bafc7adff7481cd6bb559", + "sha256": "51beffefd5a05dc7fb21d6f8fe7e22f4fe5ccb9e91f1038a829865d23820786e", "shape": [ 1 ] @@ -9341,7 +9355,7 @@ "bytes": 1313280, "dtype": "uint8", "path": "lm_head.packed_weight.u8.bin", - "sha256": "5f9cd1687384a4f22ee9b78faa44a3b66113095161374ebc91d6e6f9b60a6ea4", + "sha256": "d077cc31fb0f453749ee885c7dab678178e198916cf13735c2e8c621c200c123", "shape": [ 8208, 160 @@ -9351,7 +9365,7 @@ "bytes": 4, "dtype": "float32", "path": "lm_head.scale_values.f32.bin", - "sha256": "1aea5df41f70ea50217f47189f39b5750d114865679ec371f3b68804875da176", + "sha256": "4a6cc0d1c16f482a50974679ef9b7ef620ed03cdf8354fde8a53acada716c068", "shape": [ 1 ] @@ -9377,6 +9391,7 @@ "d_ff": 2048, "d_model": 640, "dtype": "bfloat16", + "encoder_position_embeddings": true, "head_dim": null, "kv_cache_paged": true, "masking": "build_causal_mask", @@ -9429,4 +9444,4 @@ "unk_token_id": 3, "vocab_size": 8207 } -} +} \ No newline at end of file diff --git a/modelcard.json b/modelcard.json index dd96c8f708c1abd016115714e8475e4afa40fc3a..669010808ddbf62dfd532698f895da319ea6e5f6 100644 --- a/modelcard.json +++ b/modelcard.json @@ -1,5 +1,5 @@ { - "dense_tensor_count": 42, + "dense_tensor_count": 43, "format": "browser-bitnet", "layer_count": 109, "manifest": "manifest.json", @@ -11,7 +11,7 @@ "webgpu_js": "runtime/bitnet_webgpu.js", "wgsl": "runtime/bitnet_linear.wgsl" }, - "sha256": "acc61a1a58ecfe0a6ba6ab22a5b8111370c8e2b497b4419239e6238e1e9fa1a8", + "sha256": "9517eadcd016bcfde27cb836d8126c04a3a1bb728b96c36ff3f2c8540cda3526", "tokenizer": { "bos_token_id": 1, "config_path": "tokenizer/tokenizer_config.json", @@ -23,4 +23,4 @@ "unk_token_id": 3, "vocab_size": 8207 } -} +} \ No newline at end of file diff --git a/runtime/encdec_runtime.js b/runtime/encdec_runtime.js index d971c6cb100d4e64ea926a9e427ef53c20633f6d..963215111c9228075e8029d3b9290c57a49e17b9 100644 --- a/runtime/encdec_runtime.js +++ b/runtime/encdec_runtime.js @@ -104,6 +104,17 @@ function embed(tokens, embedding, dModel) { return out; } +function addPositionEmbeddingInPlace(x, positionEmbedding, dModel) { + if (!positionEmbedding) return x; + for (let t = 0; t < x.length / dModel; t += 1) { + const src = t * dModel; + for (let c = 0; c < dModel; c += 1) { + x[src + c] += positionEmbedding[src + c]; + } + } + return x; +} + function splitHeads(x, seqLen, nHeads, headDim) { const out = []; for (let h = 0; h < nHeads; h += 1) { @@ -411,6 +422,9 @@ export class BitNetEncoderDecoderWebGPU { async encode(encInputIds) { let x = embed(encInputIds, this.tensor("enc_embed.weight"), this.graph.d_model); + if (this.graph.encoder_position_embeddings) { + x = addPositionEmbeddingInPlace(x, this.tensor("enc_pos_embed.weight"), this.graph.d_model); + } for (let i = 0; i < this.graph.n_layers; i += 1) { x = await this.encoderLayer(i, x, encInputIds.length); }