diff --git a/web-llm-models/v0_2_30/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..3908c90b47fb4eae5adbd764b357a32629764771 --- /dev/null +++ b/web-llm-models/v0_2_30/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a78f2c00a22d6e1618222402be2bf0dd6525722b31f394fdb1a46c9816160a44 +size 4000074 diff --git a/web-llm-models/v0_2_30/Llama-2-70b-chat-hf-q3f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/Llama-2-70b-chat-hf-q3f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..17050fb45d422dc91554c006c71af743f066df56 --- /dev/null +++ b/web-llm-models/v0_2_30/Llama-2-70b-chat-hf-q3f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31803d87eca0913d7043e832c8f93c54f94ea8a7e285350f2d9bbf9a51a03066 +size 5088677 diff --git a/web-llm-models/v0_2_30/Llama-2-70b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/Llama-2-70b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..425fe2541dd29e02a869d3cc216984d6f98fd8b6 --- /dev/null +++ b/web-llm-models/v0_2_30/Llama-2-70b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa6bd27a64a17c8e50ba491b67386281712b1965b7ddb40dcf64273c58888c46 +size 5050091 diff --git a/web-llm-models/v0_2_30/Llama-2-7b-chat-hf-q4f16_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_30/Llama-2-7b-chat-hf-q4f16_1-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..8536caecbad4d0f8b7691a65e289e80d9c9e8249 --- /dev/null +++ b/web-llm-models/v0_2_30/Llama-2-7b-chat-hf-q4f16_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:d7d973a204e9da3f4dfcd224825440f2f7e2d79c8f145091a147c3fae6bed024 +size 3755714 diff --git a/web-llm-models/v0_2_30/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..9d9c1ba6b867b8d45e62fe718851158abd8ae0ff --- /dev/null +++ b/web-llm-models/v0_2_30/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b5c586d0d2cc8aafb540d7dab758a1880d6f411f41eb47ba8f0cda7d1d7f235 +size 3756119 diff --git a/web-llm-models/v0_2_30/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..32a64319645432e2d9a58a73a44155e6459c6f93 --- /dev/null +++ b/web-llm-models/v0_2_30/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85975ec6bde81dff5a7506dc2d11db21fbd8e401c90abf06a7cc500277711a72 +size 3646307 diff --git a/web-llm-models/v0_2_30/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..640d050671463bc020647221c3c77fae3473388a --- /dev/null +++ b/web-llm-models/v0_2_30/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a88a180704505a432209c3f76ea1b2f1c74029e8744ebb00e323af4693cb240 +size 7167312 diff --git a/web-llm-models/v0_2_30/Llama-3-8B-Instruct-q4f16_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/Llama-3-8B-Instruct-q4f16_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..31f9cfcffb6f902509c02a3c0fe7641518f43771 --- /dev/null +++ 
b/web-llm-models/v0_2_30/Llama-3-8B-Instruct-q4f16_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6823b0f6aa474236435ca0dd0f7c67f2cca0e6a9e5467f850ab650f4d076049 +size 4718018 diff --git a/web-llm-models/v0_2_30/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..2be85217f70fedab81173c83c6dec1150ee6c654 --- /dev/null +++ b/web-llm-models/v0_2_30/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9445821d84e2094957e160239e1fe89e019c3bceec88e41213e35f3df020e7c +size 4723547 diff --git a/web-llm-models/v0_2_30/Llama-3-8B-Instruct-q4f32_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/Llama-3-8B-Instruct-q4f32_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..e707395f9dcf74bb94c9b7ab9823ae45fd0feded --- /dev/null +++ b/web-llm-models/v0_2_30/Llama-3-8B-Instruct-q4f32_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:223957f419543c75b3a1b865e3173eb2d32c774a9772b064199f8b9aa0ecc524 +size 4520045 diff --git a/web-llm-models/v0_2_30/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..88dddb27692094b955fbd8e29fff93bb1648cc1f --- /dev/null +++ b/web-llm-models/v0_2_30/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2d377dabfb84751b61e96cc44ca1c29c51f370acd5c6e04d431d29376ceb271 +size 4525793 diff --git a/web-llm-models/v0_2_30/Mistral-7B-Instruct-v0.2-q4f16_1-sw4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/Mistral-7B-Instruct-v0.2-q4f16_1-sw4k_cs1k-webgpu.wasm new file mode 100644 index 
0000000000000000000000000000000000000000..5e208aff1138f1871d3057ad1009324127c519f5 --- /dev/null +++ b/web-llm-models/v0_2_30/Mistral-7B-Instruct-v0.2-q4f16_1-sw4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38c244730831d5bd1f05fb51af382239728c5c08e67740893845e4fa3621955d +size 3783202 diff --git a/web-llm-models/v0_2_30/Mistral-7B-Instruct-v0.2-q4f32_1-sw4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/Mistral-7B-Instruct-v0.2-q4f32_1-sw4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..c87c471e150a6c3ea155c051b6b9affabfb2d52c --- /dev/null +++ b/web-llm-models/v0_2_30/Mistral-7B-Instruct-v0.2-q4f32_1-sw4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d8f7f06db2bd041505908205de6b364e02e30c789da6ccfab6296c8db71e231 +size 3676961 diff --git a/web-llm-models/v0_2_30/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_30/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..37e7755e6a3eebe8aa9de25d35c96f282bde5241 --- /dev/null +++ b/web-llm-models/v0_2_30/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a74f278bd2e22a9823b7ff7206ec7fc1f6d9df6ec7aad5a4d4116ed7ed45df29 +size 4045134 diff --git a/web-llm-models/v0_2_30/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k-webgpu.wasm b/web-llm-models/v0_2_30/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..95cb68f8cface883fa4d80a2a8c75182ecdcaeb0 --- /dev/null +++ b/web-llm-models/v0_2_30/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b58c74e7f60701a267666cc0fb1a285bbfe2dc1ebc180ac40c96f1ac82bcaae4 +size 4043659 diff --git 
a/web-llm-models/v0_2_30/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_30/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..87a1d9e2bb77f8f3c1660aaf2af28ed162996b4a --- /dev/null +++ b/web-llm-models/v0_2_30/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8c120c6305e1efe9ba2376e413ba848f802501797792f70e0fb69e6051cd37d +size 4025155 diff --git a/web-llm-models/v0_2_30/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k-webgpu.wasm b/web-llm-models/v0_2_30/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..5101364c83ab76e3d3551fd94f87fa9b4882a080 --- /dev/null +++ b/web-llm-models/v0_2_30/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0877749fefacebf0999d895bbd05c5f25f7b891921a44c74b11fc22da27814b2 +size 4023882 diff --git a/web-llm-models/v0_2_30/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k-webgpu.wasm b/web-llm-models/v0_2_30/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..267e7595564a7e47ad1988a359a33f96cffe1e2a --- /dev/null +++ b/web-llm-models/v0_2_30/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b6698ac220384f2b6112dc9e76d9f1c55b202c659c6abe78e0bce86d9c9f08a +size 3268536 diff --git a/web-llm-models/v0_2_30/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k-webgpu.wasm b/web-llm-models/v0_2_30/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b93a29f2cfb3d30911845c1298a8c1b3ac6258e2 --- /dev/null +++ b/web-llm-models/v0_2_30/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:58cc54315bf8f98e6851f9c810377d86e43a91c4eb75b8f4b5fed75279ce1813 +size 3248462 diff --git a/web-llm-models/v0_2_30/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_30/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..8187949095c2b54f568100174377ab4cc1ff7342 --- /dev/null +++ b/web-llm-models/v0_2_30/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47e6f746cbd34486e7d20d540643bd1bbd41d48b4de19e589c747caa57fca9ff +size 3510691 diff --git a/web-llm-models/v0_2_30/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_30/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..fc2efd343b7026788369a2d88387d2d1070f6f9b --- /dev/null +++ b/web-llm-models/v0_2_30/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3382168f379740bf73ebbf5b55a19554bb356f06c696e00a91386bbdcee525fb +size 3439397 diff --git a/web-llm-models/v0_2_30/gemma-2b-it-q4f16_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/gemma-2b-it-q4f16_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..70335689505eb9d0a97761fba4cb911bb8bcf36c --- /dev/null +++ b/web-llm-models/v0_2_30/gemma-2b-it-q4f16_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ac65d002c3add9f2c727fc1050c0b0f5dbeebea9434a9c5d9454217e8102fd1 +size 3426696 diff --git a/web-llm-models/v0_2_30/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..50d96a3cab9075d907479564598bb708421fe30f --- /dev/null +++ b/web-llm-models/v0_2_30/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:bc98b1682d804c4ca1f1ac9c0a16bf313a5f006184c37f887e5fab8491947125 +size 3418409 diff --git a/web-llm-models/v0_2_30/gemma-2b-it-q4f32_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/gemma-2b-it-q4f32_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..db5307bafa41b0076d876f1f19c03ad859129da4 --- /dev/null +++ b/web-llm-models/v0_2_30/gemma-2b-it-q4f32_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95f2bea36f5b9d2c2ad4837313e5ff90132c5580e6396e119d1ab5b351a92ca9 +size 3357441 diff --git a/web-llm-models/v0_2_30/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b2ef61a575bfc48d8e181e7bbbd87cc2b2d84ab8 --- /dev/null +++ b/web-llm-models/v0_2_30/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:177c736725df0f91eb6421491baed13817bc45ffa87b3ee3d37b90f832031d2b +size 3359729 diff --git a/web-llm-models/v0_2_30/gpt2-medium-q0f16-ctx1k-webgpu.wasm b/web-llm-models/v0_2_30/gpt2-medium-q0f16-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..9e140725fe196086a0ab59b58f0a3cecd40e5d00 --- /dev/null +++ b/web-llm-models/v0_2_30/gpt2-medium-q0f16-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3056254097dc3f5483fdef51516d5b1d847eb520aab3e7e3446ea5a30a81b3c +size 3685171 diff --git a/web-llm-models/v0_2_30/gpt2-q0f16-ctx1k-webgpu.wasm b/web-llm-models/v0_2_30/gpt2-q0f16-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b1074de98677b01cdbeb503b0679d850845642fb --- /dev/null +++ b/web-llm-models/v0_2_30/gpt2-q0f16-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:584cd0b1a56d7b46bd3283a5965a9c2478b161bba2ca0d213d51773289b4f92e +size 3321904 diff --git a/web-llm-models/v0_2_30/phi-1_5-q0f16-ctx2k-webgpu.wasm b/web-llm-models/v0_2_30/phi-1_5-q0f16-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..d57bc53d9653c7d5a20c69670c0469d8cf499934 --- /dev/null +++ b/web-llm-models/v0_2_30/phi-1_5-q0f16-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f52492b33a05317fcbda6110c7bc901458f35ef3be985370a428e08d344d1235 +size 3615730 diff --git a/web-llm-models/v0_2_30/phi-1_5-q0f32-ctx2k-webgpu.wasm b/web-llm-models/v0_2_30/phi-1_5-q0f32-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..57e19ce2e7e2807c2c541e8f199e18bc45dd5a64 --- /dev/null +++ b/web-llm-models/v0_2_30/phi-1_5-q0f32-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8dd57a9c011e1a7d45635d3a13eabb7e51ad32492035304f90669347bb9478c +size 3597640 diff --git a/web-llm-models/v0_2_30/phi-1_5-q4f16_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_30/phi-1_5-q4f16_1-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..a2c61017d5c8b20f668dd8c9ea23376ad23fd42d --- /dev/null +++ b/web-llm-models/v0_2_30/phi-1_5-q4f16_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4d5fda186db4187605bd0786f0f1279d61e98e3c2d73d64070eef8c16d227df +size 3722907 diff --git a/web-llm-models/v0_2_30/phi-1_5-q4f16_1-ctx2k-webgpu.wasm b/web-llm-models/v0_2_30/phi-1_5-q4f16_1-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..7e5818fbd009da9797f9671163872187ccebfa99 --- /dev/null +++ b/web-llm-models/v0_2_30/phi-1_5-q4f16_1-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc09ffd12c91c8f4ed033b47d71860f0ecbf463d3e04e04eb7ab25be80cb34ff +size 3716842 diff --git 
a/web-llm-models/v0_2_30/phi-1_5-q4f32_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_30/phi-1_5-q4f32_1-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..4a0059b5596f0642485e666ffd6b8feb1b619c29 --- /dev/null +++ b/web-llm-models/v0_2_30/phi-1_5-q4f32_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff07062905553d550449280169414db220f8177ad7e0e4a47bd789d225c9af42 +size 3705968 diff --git a/web-llm-models/v0_2_30/phi-1_5-q4f32_1-ctx2k-webgpu.wasm b/web-llm-models/v0_2_30/phi-1_5-q4f32_1-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b9503772dfbdbb99d45e5ffa387106c958e9ba9d --- /dev/null +++ b/web-llm-models/v0_2_30/phi-1_5-q4f32_1-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:044a910df9ebdaaa6c4bf3faea0c32b15fd7c47ec47c5875922d65be6802498b +size 3706135 diff --git a/web-llm-models/v0_2_30/phi-2-q0f16-ctx2k-webgpu.wasm b/web-llm-models/v0_2_30/phi-2-q0f16-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b50c5324cfe8a07ed1f81afa17729e398b1518bd --- /dev/null +++ b/web-llm-models/v0_2_30/phi-2-q0f16-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b1e78f7430328bf8817ea385ae2e56f74fff0844a59bb9d2fdde97c08315d37 +size 3706591 diff --git a/web-llm-models/v0_2_30/phi-2-q0f32-ctx2k-webgpu.wasm b/web-llm-models/v0_2_30/phi-2-q0f32-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..e5e13ec0ef8195808d0be5f1bb064a62ba7950c1 --- /dev/null +++ b/web-llm-models/v0_2_30/phi-2-q0f32-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d45483c6812679950b2c2e802f333c20a12a741399149c91e770f8b875c0eca2 +size 3704831 diff --git a/web-llm-models/v0_2_30/phi-2-q4f16_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_30/phi-2-q4f16_1-ctx1k-webgpu.wasm new file mode 100644 index 
0000000000000000000000000000000000000000..797c734e0d03494d76fb545622a4fec912426a0c --- /dev/null +++ b/web-llm-models/v0_2_30/phi-2-q4f16_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ad6097925c35134d42aa74dcc1fa98f0228e1eeeb97ff84245bb07bde88f94d +size 3874153 diff --git a/web-llm-models/v0_2_30/phi-2-q4f16_1-ctx2k-webgpu.wasm b/web-llm-models/v0_2_30/phi-2-q4f16_1-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..e4e897340605d2bb1cf79503be2147e91a0bda4d --- /dev/null +++ b/web-llm-models/v0_2_30/phi-2-q4f16_1-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cb52cb8607bc4ba5bea2e41e3f0017fa8a2356e819cf80e8b21ffea7664732c +size 3873139 diff --git a/web-llm-models/v0_2_30/phi-2-q4f32_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_30/phi-2-q4f32_1-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..84e3cdec2647e25654cfdb5f23d80d0711abea43 --- /dev/null +++ b/web-llm-models/v0_2_30/phi-2-q4f32_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33a547dddb660429b029e5c1d56f8ca8fdb51f1bb5c0b1b5800b29f24d5ab2a4 +size 3865938 diff --git a/web-llm-models/v0_2_30/phi-2-q4f32_1-ctx2k-webgpu.wasm b/web-llm-models/v0_2_30/phi-2-q4f32_1-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..d399d5fe3ffb4d55358b013c55c16e70560d5064 --- /dev/null +++ b/web-llm-models/v0_2_30/phi-2-q4f32_1-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41e1175d97e3bfd031c4586f2f407ddb17de2a7ff65c4fd7d00771d899a46420 +size 3868789 diff --git a/web-llm-models/v0_2_30/stablelm-2-zephyr-1_6b-q4f16_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/stablelm-2-zephyr-1_6b-q4f16_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..5f1f8010787507facd91b681accb0c531d632725 --- /dev/null +++ 
b/web-llm-models/v0_2_30/stablelm-2-zephyr-1_6b-q4f16_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4b6aaee15ec3993a77c62b381b9d1d81ffedca2a901098ec0121fbfa9de3146 +size 3692600 diff --git a/web-llm-models/v0_2_30/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..c8ffa1c9195aef3b5d5b602b215b410fcc65aa8b --- /dev/null +++ b/web-llm-models/v0_2_30/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9682df1920b1523a5ea52603b7d5609b70415a3a61cf402d74b5473d2d6e6bef +size 3700368 diff --git a/web-llm-models/v0_2_30/stablelm-2-zephyr-1_6b-q4f32_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/stablelm-2-zephyr-1_6b-q4f32_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..5924c9c98e6aa036762c48d5685706f34fa0591d --- /dev/null +++ b/web-llm-models/v0_2_30/stablelm-2-zephyr-1_6b-q4f32_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:002494fb0d3612965b878a55b7b97fbd01f7bb71313711b6f412c462473edafe +size 3673424 diff --git a/web-llm-models/v0_2_30/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_30/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..dfd3a7bf563017181fd545b8e51bf5bd73fe2475 --- /dev/null +++ b/web-llm-models/v0_2_30/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c8f7b4c3eb20540d2ab40d0a7fa9e725fd4730d2dad9cfba2f1e966b641cb7f +size 3679797 diff --git a/web-llm-models/v0_2_34/Hermes-2-Pro-Mistral-7B-q4f16_1-sw4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_34/Hermes-2-Pro-Mistral-7B-q4f16_1-sw4k_cs1k-webgpu.wasm new file mode 
100644 index 0000000000000000000000000000000000000000..814d83ec6732a7044cd71026208b37ee33bb8f78 --- /dev/null +++ b/web-llm-models/v0_2_34/Hermes-2-Pro-Mistral-7B-q4f16_1-sw4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc85bfb1bb25e18fe436bb4dd1239acc1817a7019c9211cb7e0bf8e735869470 +size 3888798 diff --git a/web-llm-models/v0_2_34/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_34/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..c5c2c6cfc761d85d33722c4077029628d9999312 --- /dev/null +++ b/web-llm-models/v0_2_34/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42f11f0db35c2301adfb4ce77e4f08e430fce0491799467ecebe431d940982b2 +size 5217380 diff --git a/web-llm-models/v0_2_34/Llama-2-7b-chat-hf-q4f16_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_34/Llama-2-7b-chat-hf-q4f16_1-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..a7335bed7d683f3853915d88f143b97ad64b8deb --- /dev/null +++ b/web-llm-models/v0_2_34/Llama-2-7b-chat-hf-q4f16_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e09883113764ba1fdaaa6b30dd8d1f56585b1d8273f072a6443157205c559f20 +size 4776918 diff --git a/web-llm-models/v0_2_34/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_34/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..145be97a7b507ea5444c67941ff9c6ef7d372492 --- /dev/null +++ b/web-llm-models/v0_2_34/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad27f14797266027df84580647e1b4c43544423e605afeb9da444ec44e29d491 +size 4776915 diff --git a/web-llm-models/v0_2_34/Llama-2-7b-chat-hf-q4f32_1-ctx1k-webgpu.wasm 
b/web-llm-models/v0_2_34/Llama-2-7b-chat-hf-q4f32_1-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..0e86c5ba088766cf39a3f07f80e81a564c0702f9 --- /dev/null +++ b/web-llm-models/v0_2_34/Llama-2-7b-chat-hf-q4f32_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2376cb97eab019bd58cf8f6b216aefca98871d324bfd04414c6bb3e22cab7216 +size 4577106 diff --git a/web-llm-models/v0_2_34/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_34/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..36a696a2f4b8572448dbdf8a14604e6fc990acbb --- /dev/null +++ b/web-llm-models/v0_2_34/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69807e2898b26324e0c0a1478d98430c78aa1f1273c794d845630d6fcab0bcb9 +size 4577123 diff --git a/web-llm-models/v0_2_34/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_34/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..ba9a1c9de9f3f6fbfaaf6ccde667c672155bc127 --- /dev/null +++ b/web-llm-models/v0_2_34/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb18875bb93ac8300fe4b720fbdb7f3ff96b0ade0f0713817d9b363d90a71881 +size 7266794 diff --git a/web-llm-models/v0_2_34/Llama-3-8B-Instruct-q4f16_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_34/Llama-3-8B-Instruct-q4f16_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..feaa01cac7fe02f69cae8434d8e0c286f818a32c --- /dev/null +++ b/web-llm-models/v0_2_34/Llama-3-8B-Instruct-q4f16_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45b569e4b9254fcd3a72869fc5f4077fabe927a5368e9660814e58b4e48028ff +size 4804163 diff --git 
a/web-llm-models/v0_2_34/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_34/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..3472057ddee72f91c7d29d87f8d402954d4a5e65 --- /dev/null +++ b/web-llm-models/v0_2_34/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2180c17a345801d1ba90fd3c884388a121d13495f6d3078ac14f22af146e1ffa +size 4809690 diff --git a/web-llm-models/v0_2_34/Llama-3-8B-Instruct-q4f32_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_34/Llama-3-8B-Instruct-q4f32_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..c7bb90237eeb6fe1b190a37cfd8d6f279f0d0234 --- /dev/null +++ b/web-llm-models/v0_2_34/Llama-3-8B-Instruct-q4f32_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52e912b2fa327d38ee3af34bc99314490cf90f67c9e84ba217bb2e1ce2527461 +size 4605701 diff --git a/web-llm-models/v0_2_34/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_34/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..7b8569d2ebbb730b2aa1c721c26b42e8d4c7eb8e --- /dev/null +++ b/web-llm-models/v0_2_34/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:121a1a1d3d2b2bf304c5fede6873f86214da55a83aead1fe7dfd0577e39a38d0 +size 4606273 diff --git a/web-llm-models/v0_2_34/Mistral-7B-Instruct-v0.2-q4f16_1-sw4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_34/Mistral-7B-Instruct-v0.2-q4f16_1-sw4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b28f057c5e2ddcc2990fbfbbe2f698e8e8e99ba2 --- /dev/null +++ b/web-llm-models/v0_2_34/Mistral-7B-Instruct-v0.2-q4f16_1-sw4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:01ff6bc8221531e710df6db5e2163606e6edcb043d756c8745bf9640f53e2ce1 +size 3947150 diff --git a/web-llm-models/v0_2_34/Mistral-7B-Instruct-v0.2-q4f32_1-sw4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_34/Mistral-7B-Instruct-v0.2-q4f32_1-sw4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..23fa161b3c8fa38156c4ee319442a2e8e2860a26 --- /dev/null +++ b/web-llm-models/v0_2_34/Mistral-7B-Instruct-v0.2-q4f32_1-sw4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc8d8494383ac4c25aa6f35fbed2305e789b1e508a83c3d02466f2f5e08aed39 +size 3827985 diff --git a/web-llm-models/v0_2_34/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_34/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..8b5e3bdb872420dfa3dcfba972fbed8c1ba8835d --- /dev/null +++ b/web-llm-models/v0_2_34/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2def4e72faa862a312b87fab7c8cba6a5cba21353a3e3f1fdb125c12dd257e48 +size 4221627 diff --git a/web-llm-models/v0_2_34/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k-webgpu.wasm b/web-llm-models/v0_2_34/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..407ae6c5155fc30d6d345c746dd76e7cbfef59b0 --- /dev/null +++ b/web-llm-models/v0_2_34/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ac23ad1709a00138323abc095894caf64af8fb7b6bac5fcfc31e57df210a2f0 +size 4215867 diff --git a/web-llm-models/v0_2_34/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_34/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..269997a1790e47c5b9bd1c717fdfded9f7ebd80d --- /dev/null +++ 
b/web-llm-models/v0_2_34/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57191d0b86d9c71579f3a0ac55f9ccf226a7356d275850d0ffaa723e1695c062 +size 4196405 diff --git a/web-llm-models/v0_2_34/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k-webgpu.wasm b/web-llm-models/v0_2_34/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..0423e85644bf73a774c8a7a7854a22f45fc5ddc5 --- /dev/null +++ b/web-llm-models/v0_2_34/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:038975ed6dd704b2982df4a56acfe6f4c1f75a7fae70655b569a21c7eb82dc2a +size 4195596 diff --git a/web-llm-models/v0_2_34/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k-webgpu.wasm b/web-llm-models/v0_2_34/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..3ea4f61685197f92236c9592a1d96010e1b76ae8 --- /dev/null +++ b/web-llm-models/v0_2_34/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56a3682a1bd380b55555a927477834ac40ba0f1038d2d8b5a8e373c7b310e025 +size 4062027 diff --git a/web-llm-models/v0_2_34/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k-webgpu.wasm b/web-llm-models/v0_2_34/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..f989422e13da0b2676ebdfdfbee2fe43d9cbe5fd --- /dev/null +++ b/web-llm-models/v0_2_34/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f5dd511fdd80350fa4e27cb8fbe9e169aab16f668019a3f191c9ba9acdb9bd0 +size 3939920 diff --git a/web-llm-models/v0_2_34/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_34/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx1k-webgpu.wasm new file mode 100644 index 
0000000000000000000000000000000000000000..e73e13997c6420ec3e5ae96a34b6f74dd4cd5b2b --- /dev/null +++ b/web-llm-models/v0_2_34/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ed8cd4d1d3ca174f7fd2616a19f93e10b465c86bbb77ad7fadace3afefcc5bb +size 4283465 diff --git a/web-llm-models/v0_2_34/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_34/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..88376555c58e2333853827128a1accac9d778624 --- /dev/null +++ b/web-llm-models/v0_2_34/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce04eda4789f265ea3032d947113af5de2ffeaf8e1086ab35fa07d864856da37 +size 4153573 diff --git a/web-llm-models/v0_2_34/gemma-2b-it-q4f16_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_34/gemma-2b-it-q4f16_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..c076f0bb1f6c30c8ad8d381694c547a06c960e3e --- /dev/null +++ b/web-llm-models/v0_2_34/gemma-2b-it-q4f16_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c68891b865fd0b9036f1c2550247f17e794ce0225575689b5c85b4ddd9290b2 +size 3568059 diff --git a/web-llm-models/v0_2_34/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_34/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b64c802724ee680901de29729d72dda462ae0d1d --- /dev/null +++ b/web-llm-models/v0_2_34/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:927164f56d265816ca88f1069d4dae3864ae10e7161068802b7a863c41bec1ad +size 3567467 diff --git a/web-llm-models/v0_2_34/gemma-2b-it-q4f32_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_34/gemma-2b-it-q4f32_1-ctx1k_cs1k-webgpu.wasm new file mode 
100644 index 0000000000000000000000000000000000000000..1e8149c561999fd4464014852f940484e59c913c --- /dev/null +++ b/web-llm-models/v0_2_34/gemma-2b-it-q4f32_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbf4758d4247f38fb3c8f1fc333bf7f2c6102028450e7d6fce0f09c7c875df48 +size 3505474 diff --git a/web-llm-models/v0_2_34/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_34/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..3dfa0cc8bce40ac47a1be8898f488eb47408e1e9 --- /dev/null +++ b/web-llm-models/v0_2_34/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db2fb549b7d2ef58e1a75f159de3443b3dad2d34d6377e39fdfbd550938f68f5 +size 3504892 diff --git a/web-llm-models/v0_2_34/gpt2-medium-q0f16-ctx1k-webgpu.wasm b/web-llm-models/v0_2_34/gpt2-medium-q0f16-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..dfb6281bf72c009e92e1e71d67c7f07d6e5e9d86 --- /dev/null +++ b/web-llm-models/v0_2_34/gpt2-medium-q0f16-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01fbf753b1f54464407e02d268a71a08c6a32919a108646a8bff1ef55ed54836 +size 3842397 diff --git a/web-llm-models/v0_2_34/gpt2-q0f16-ctx1k-webgpu.wasm b/web-llm-models/v0_2_34/gpt2-q0f16-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..ee38e3232afc02660258ba6e642125128d62c2e5 --- /dev/null +++ b/web-llm-models/v0_2_34/gpt2-q0f16-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5a649acb4226c8adf55ce38e206f44ceac7093450ce26519ab3d1b6fffb7ae3 +size 3476199 diff --git a/web-llm-models/v0_2_34/phi-1_5-q0f16-ctx2k-webgpu.wasm b/web-llm-models/v0_2_34/phi-1_5-q0f16-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..fead1c95e0d7b303f49300f3a5b5bb67f8d526b1 --- 
/dev/null +++ b/web-llm-models/v0_2_34/phi-1_5-q0f16-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6ebba776459c7baed32ed5155ebd87188be5e86c9739b40468dc62abba4187b +size 3777558 diff --git a/web-llm-models/v0_2_34/phi-1_5-q0f32-ctx2k-webgpu.wasm b/web-llm-models/v0_2_34/phi-1_5-q0f32-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..3f886a4ec213f9b4e953f61241e22473be79cf62 --- /dev/null +++ b/web-llm-models/v0_2_34/phi-1_5-q0f32-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d22cbc6d777d84b6cc84e412ef1a9b0143013647ad2341aebac2cb8a624cf522 +size 3760455 diff --git a/web-llm-models/v0_2_34/phi-1_5-q4f16_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_34/phi-1_5-q4f16_1-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..9e5fb1a808679ff0626d712ed0852874ef01c371 --- /dev/null +++ b/web-llm-models/v0_2_34/phi-1_5-q4f16_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f56e87a4bbcab1b0060bb241e52161ddc18a9e25a837de3c6242cf8f6b345617 +size 3897243 diff --git a/web-llm-models/v0_2_34/phi-1_5-q4f16_1-ctx2k-webgpu.wasm b/web-llm-models/v0_2_34/phi-1_5-q4f16_1-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..f615bca71dbb0c5385a096983e3e43234f5d94b3 --- /dev/null +++ b/web-llm-models/v0_2_34/phi-1_5-q4f16_1-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bf3e3869e627c09556c03a3f49e15b495ed84a17e3e074415a7e02d7c68b89b +size 3891541 diff --git a/web-llm-models/v0_2_34/phi-1_5-q4f32_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_34/phi-1_5-q4f32_1-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b65999a2adc1126f20c76bb4992270b36c72b9bc --- /dev/null +++ b/web-llm-models/v0_2_34/phi-1_5-q4f32_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:42390977c550092a324db54e8dfd8830e2968de47b5bd6621c558d5ff7ad79b3 +size 3879580 diff --git a/web-llm-models/v0_2_34/phi-1_5-q4f32_1-ctx2k-webgpu.wasm b/web-llm-models/v0_2_34/phi-1_5-q4f32_1-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..78ff7e3f650a10df1c45cd12fc44d9d761f323e9 --- /dev/null +++ b/web-llm-models/v0_2_34/phi-1_5-q4f32_1-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:467d2929a48d5159827614c8a6cfea90aeff70b5a2ca3a53d816512c3c0cde0d +size 3879659 diff --git a/web-llm-models/v0_2_34/phi-2-q0f16-ctx2k-webgpu.wasm b/web-llm-models/v0_2_34/phi-2-q0f16-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..aa1e37ae85655a5b44359cceb1e1c3fc88b8c871 --- /dev/null +++ b/web-llm-models/v0_2_34/phi-2-q0f16-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c24ccd73f2eb0a46b56832adab988f1ffe196b4f067bc1d4fb531e7da26d56d +size 3865419 diff --git a/web-llm-models/v0_2_34/phi-2-q0f32-ctx2k-webgpu.wasm b/web-llm-models/v0_2_34/phi-2-q0f32-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..cd9834226311eb44c1c055741a5738a53660aed7 --- /dev/null +++ b/web-llm-models/v0_2_34/phi-2-q0f32-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:072b406f3521be902388bc2f4b50dbc59f27de737170231f0ec2c0615f03bec9 +size 3866660 diff --git a/web-llm-models/v0_2_34/phi-2-q4f16_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_34/phi-2-q4f16_1-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b071b47e6149189991391621e7fee2f82e4dcebb --- /dev/null +++ b/web-llm-models/v0_2_34/phi-2-q4f16_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e22c1de35dae8d1b5085adf8bb961d4b2c1dae8c1feee8b07b4208db9d96298b +size 4038758 diff --git a/web-llm-models/v0_2_34/phi-2-q4f16_1-ctx2k-webgpu.wasm 
b/web-llm-models/v0_2_34/phi-2-q4f16_1-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..28fec44f0a3e8612da0d493ce4ba6319b98acbec --- /dev/null +++ b/web-llm-models/v0_2_34/phi-2-q4f16_1-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c331e1a3b8895bae65f31af04807c65f2fe52710c7a5eb4d62d7e43b5f5a987d +size 4045000 diff --git a/web-llm-models/v0_2_34/phi-2-q4f32_1-ctx1k-webgpu.wasm b/web-llm-models/v0_2_34/phi-2-q4f32_1-ctx1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..ab936ba869af05d77a191339b828a5e8ce53c3fc --- /dev/null +++ b/web-llm-models/v0_2_34/phi-2-q4f32_1-ctx1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:054b5852eaf38c7bd183a5c3c70ea21df1a8e8d1c36e442844973706b9f0e78d +size 4039951 diff --git a/web-llm-models/v0_2_34/phi-2-q4f32_1-ctx2k-webgpu.wasm b/web-llm-models/v0_2_34/phi-2-q4f32_1-ctx2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b666574780bc76e5b1dd581f7fabd240451df6b4 --- /dev/null +++ b/web-llm-models/v0_2_34/phi-2-q4f32_1-ctx2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37b487d67f1009cfc2f92ea2464a97ebd3142245cbe5a9c03480cfeb2d60c5f3 +size 4040072 diff --git a/web-llm-models/v0_2_39/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..7b44843ea241f820923a0ffef951ad47961adedb --- /dev/null +++ b/web-llm-models/v0_2_39/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5ae7b993198c6164560fdedc93b8be30c575377c39dd8a4d0bdb3cb3dea1572 +size 5374165 diff --git a/web-llm-models/v0_2_39/Llama-2-7b-chat-hf-q4f16_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Llama-2-7b-chat-hf-q4f16_1-ctx1k_cs1k-webgpu.wasm new 
file mode 100644 index 0000000000000000000000000000000000000000..681549b285190bfbc7f4834dc76ae1ac45684d53 --- /dev/null +++ b/web-llm-models/v0_2_39/Llama-2-7b-chat-hf-q4f16_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94c28b4dcadc713bca27d9ff99c0d27ce1d96b6680ea69bd5d3427bb86a9381c +size 4939881 diff --git a/web-llm-models/v0_2_39/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..197b8340a6fc5173bfc9eebff71281c0b34218b3 --- /dev/null +++ b/web-llm-models/v0_2_39/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dfb2eef83eaa21c7b2a62eb6d72849cd58f559f17264355752f4cb5d64e4326 +size 4939573 diff --git a/web-llm-models/v0_2_39/Llama-2-7b-chat-hf-q4f32_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Llama-2-7b-chat-hf-q4f32_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..3fe2e92f1b140ffa53695f07df78b3a11bc9a1be --- /dev/null +++ b/web-llm-models/v0_2_39/Llama-2-7b-chat-hf-q4f32_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa11af0705bfad780c9ed3dd6bf12dfa889a7f385646c4d3035958ec1dc74c00 +size 4741078 diff --git a/web-llm-models/v0_2_39/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..14f4961524bf27632d059c4c9169874095a57707 --- /dev/null +++ b/web-llm-models/v0_2_39/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f7995834e18ffcddc5ca04367e48ca1e33245c6f6d48df7d9c9cd9754f75fc4 +size 4741091 diff --git a/web-llm-models/v0_2_39/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm 
b/web-llm-models/v0_2_39/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..209b3c57cdad6250b7ae4f5fd1ada3946e417c42 --- /dev/null +++ b/web-llm-models/v0_2_39/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:183bcaa5940e739bc5a5c466a49ff9827d6b19fe0c72000a3af0d38080892d58 +size 7392666 diff --git a/web-llm-models/v0_2_39/Llama-3-8B-Instruct-q4f16_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Llama-3-8B-Instruct-q4f16_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..eac3caf9fd5301d80726d1d37e93de65091e0ea7 --- /dev/null +++ b/web-llm-models/v0_2_39/Llama-3-8B-Instruct-q4f16_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6dca659ebd7f0864e1830ba577ebcee1a074b05ac41514b847b7782c6e61320 +size 4967153 diff --git a/web-llm-models/v0_2_39/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b9528a6f5ab67a4776d00bbe30d36d9561d90332 --- /dev/null +++ b/web-llm-models/v0_2_39/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f83d646850ccae4560df1e05582ee28f3c706158edd33a35d6e684aa10e60311 +size 4967166 diff --git a/web-llm-models/v0_2_39/Llama-3-8B-Instruct-q4f32_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Llama-3-8B-Instruct-q4f32_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..1c291512bcca48db06c284050a63a3e4f344ae11 --- /dev/null +++ b/web-llm-models/v0_2_39/Llama-3-8B-Instruct-q4f32_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d0e0c46ecc2e97673ba288b0fbd9ba2e401b829f89e76525677139a5deef125 +size 4769303 diff --git 
a/web-llm-models/v0_2_39/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..c60d58a58f33469496ec5bf14a554d9d2a9287c1 --- /dev/null +++ b/web-llm-models/v0_2_39/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8176afb083e277b60b836eac3c0d384614c911469019785b0475f0358eb09193 +size 4769308 diff --git a/web-llm-models/v0_2_39/Mistral-7B-Instruct-v0.2-q4f16_1-sw4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Mistral-7B-Instruct-v0.2-q4f16_1-sw4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..864385f8438cd221d1f5f505d7ab7906e6c69746 --- /dev/null +++ b/web-llm-models/v0_2_39/Mistral-7B-Instruct-v0.2-q4f16_1-sw4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fa6a701ac049931849cef9d6c6ec58e540a0feeecee367916f902a9e749b149 +size 4117290 diff --git a/web-llm-models/v0_2_39/Mistral-7B-Instruct-v0.2-q4f32_1-sw4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Mistral-7B-Instruct-v0.2-q4f32_1-sw4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..eecdd36ff19c4bbba556bea316fbd87876b65e23 --- /dev/null +++ b/web-llm-models/v0_2_39/Mistral-7B-Instruct-v0.2-q4f32_1-sw4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38e6617a6decc412882c8b78a0679d264eadc9cca0f49cf93d415172ee8ca0f7 +size 4003768 diff --git a/web-llm-models/v0_2_39/Mistral-7B-Instruct-v0.3-q4f16_1-sw4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Mistral-7B-Instruct-v0.3-q4f16_1-sw4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..d62af25a56d47e216f2479d3da599e6d7ddf4e45 --- /dev/null +++ b/web-llm-models/v0_2_39/Mistral-7B-Instruct-v0.3-q4f16_1-sw4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:b1cd36ca4981d09b8185470bdc29626c29a77ce4959f13cc05e5a58399c63a0e +size 4117056 diff --git a/web-llm-models/v0_2_39/Mistral-7B-Instruct-v0.3-q4f32_1-sw4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Mistral-7B-Instruct-v0.3-q4f32_1-sw4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..a6d4eeb02ab84d3834a1cce7fa03527ce7342357 --- /dev/null +++ b/web-llm-models/v0_2_39/Mistral-7B-Instruct-v0.3-q4f32_1-sw4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8968620bd0c417504b50efa314f6fb846649803c52a4e93cddc4462f3111da3e +size 4003935 diff --git a/web-llm-models/v0_2_39/Phi-3-mini-4k-instruct-q4f16_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Phi-3-mini-4k-instruct-q4f16_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..de36f9c8f870e516796ed90cdbfc9a0d6c23f4d0 --- /dev/null +++ b/web-llm-models/v0_2_39/Phi-3-mini-4k-instruct-q4f16_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4baf4fb4f399d08e00a7f16fc7320424137878fc484e798aebf801d3453caf9b +size 4111335 diff --git a/web-llm-models/v0_2_39/Phi-3-mini-4k-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Phi-3-mini-4k-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..2502b6272be618b2b83cfc4fab1bb9485e58c3c4 --- /dev/null +++ b/web-llm-models/v0_2_39/Phi-3-mini-4k-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8869f20805a0927536dbe85ca85122336d938a3188c2a4c04f2b13700b9928b3 +size 4111742 diff --git a/web-llm-models/v0_2_39/Phi-3-mini-4k-instruct-q4f32_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Phi-3-mini-4k-instruct-q4f32_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..500c4d0dd31f10ee2f6720c121c65218e1c7fc70 --- 
/dev/null +++ b/web-llm-models/v0_2_39/Phi-3-mini-4k-instruct-q4f32_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:974360bb2d7cb7713b974d3a02c083d478eaa52d42288ac7394703ec7e3a1554 +size 4016798 diff --git a/web-llm-models/v0_2_39/Phi-3-mini-4k-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Phi-3-mini-4k-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..0880f9c8da81b0d300a63d962688000b74b93cba --- /dev/null +++ b/web-llm-models/v0_2_39/Phi-3-mini-4k-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:727d7590c0f71c774ac19026631f4a286e942ac99a0987870b10da3bd4cdcdf3 +size 4016710 diff --git a/web-llm-models/v0_2_39/Qwen1.5-1.8B-Chat-q4f16_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Qwen1.5-1.8B-Chat-q4f16_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..f6c9419bf4846e93ab63d4d4431526277d32b9c0 --- /dev/null +++ b/web-llm-models/v0_2_39/Qwen1.5-1.8B-Chat-q4f16_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eadf922041a91ac6a8c68856c64b894b161d3e9413c78acd6e0bd7d6a9ae029 +size 3933624 diff --git a/web-llm-models/v0_2_39/Qwen1.5-1.8B-Chat-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Qwen1.5-1.8B-Chat-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..41ac46f838992d25b74ab2cb4c1e0b9516450728 --- /dev/null +++ b/web-llm-models/v0_2_39/Qwen1.5-1.8B-Chat-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09913b00eb0f679c9c9dfb20fa360b9da6459de629b35afaf548d73b935aa802 +size 3933658 diff --git a/web-llm-models/v0_2_39/Qwen1.5-1.8B-Chat-q4f32_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Qwen1.5-1.8B-Chat-q4f32_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 
0000000000000000000000000000000000000000..eff26344fb5c61a453f27f2213e7ed88968617ad --- /dev/null +++ b/web-llm-models/v0_2_39/Qwen1.5-1.8B-Chat-q4f32_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a8b974817e3fbf14c5d2c380f757c6610d65ffacf2bad9338ab8ffc5b52d626 +size 3849469 diff --git a/web-llm-models/v0_2_39/Qwen1.5-1.8B-Chat-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/Qwen1.5-1.8B-Chat-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..45c91a603faf7c4e74223cd10877664da7311645 --- /dev/null +++ b/web-llm-models/v0_2_39/Qwen1.5-1.8B-Chat-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dc7f3edebdca030e8935af2387983db6ef21b2196771621a046b0f3dbbc6d48 +size 3849764 diff --git a/web-llm-models/v0_2_39/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..f72d9a5ee1aab358bbdf74cbfc128d43bc52836d --- /dev/null +++ b/web-llm-models/v0_2_39/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d433036d3dfa9279d6b2f5d5c1388cfc8d2bc0f8ae48c3901dbf2238fb14f85d +size 4391294 diff --git a/web-llm-models/v0_2_39/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..234ae83df3d60a6ad335954b1afcc7290cde04de --- /dev/null +++ b/web-llm-models/v0_2_39/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b51a23ee159a45b9142ce78f1ee13014a9f44163d4feb41ab0cdebf07edce142 +size 4391301 diff --git 
a/web-llm-models/v0_2_39/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..2ab9e591d4f934ff23ca060c8b2ee951922b0702 --- /dev/null +++ b/web-llm-models/v0_2_39/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bedb5f4d2d2d5fb54262b529bfb908f827241f7bd03603e79e8ea6cb714c3ff3 +size 4371591 diff --git a/web-llm-models/v0_2_39/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..0018ef05c65b9e1c0958588f9db96e099a743d6f --- /dev/null +++ b/web-llm-models/v0_2_39/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f1e03edb56d80e61f1a766b7165a46fcff7ecb0e1b5780ccec57d8b4aa679a4 +size 4371592 diff --git a/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..de703f5842af271ce9d9ca14b7b3d2e57da90945 --- /dev/null +++ b/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fb0035eab643184cbf51d1ad65300a8709c83f28d30525c9283fd4e3c9aa45e +size 4234765 diff --git a/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..6f2842d2650b666adbadf1239aef3d6154b240cf --- /dev/null +++ b/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:c6e73aa524f7126bdc67902190d54aa3f3f76a22f06cf6619b2212546d851964 +size 4113933 diff --git a/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..ce5361980e3ad8c4d08c6308c89f15a7baea5665 --- /dev/null +++ b/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b442a609eb1e0811c4e3230370cf35d602fe6fccfaf282b352d5e2945406025c +size 4454872 diff --git a/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..42937820630f59dcd17260fa8e8b1798cf7d0959 --- /dev/null +++ b/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14d36c24b3fea8f87eafa17f73aa40156d2cfa9de2b92d54b7f92d09740e6565 +size 4455150 diff --git a/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..0d4959beb3eaade1fa50d3d6b362504d880c8842 --- /dev/null +++ b/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab8d03f5cb7492ffc296a65d4c2776762a3c62c8d4c8175c602c8923381c5e3e +size 4319392 diff --git a/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 
0000000000000000000000000000000000000000..bc41c582e71f4fb30137bf0d6206026fa9e47f90 --- /dev/null +++ b/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddd485787c96959d52b01860e369ee2e68b94558ef0ee6e9148a7ffdad50b03d +size 4319122 diff --git a/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v1.0-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v1.0-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..e35bc0be1b3ac04dd268c76e13247f68dc173847 --- /dev/null +++ b/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v1.0-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c413fa6f46827408bd899bd778353d07619752ba4fd5e889931bf7ec74be91eb +size 4454670 diff --git a/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v1.0-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v1.0-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..9f0392af71aea9160403e46544e4b0b92b264dd8 --- /dev/null +++ b/web-llm-models/v0_2_39/TinyLlama-1.1B-Chat-v1.0-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b84eb4eb2eff80c5c910ab9f1f4c1cda343cf6e513eba250a2c1056206e787b5 +size 4319187 diff --git a/web-llm-models/v0_2_39/gemma-2b-it-q4f16_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/gemma-2b-it-q4f16_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..771f4f1d662276585df5f00c48e4ca1c45fa93c5 --- /dev/null +++ b/web-llm-models/v0_2_39/gemma-2b-it-q4f16_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:816521b78414ed6427757581e61a4277471c61748839f690190bb7ccc797526b +size 3743549 diff --git a/web-llm-models/v0_2_39/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm 
b/web-llm-models/v0_2_39/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..17a91116131e1e2ef1a43c7058dc1e6932205641 --- /dev/null +++ b/web-llm-models/v0_2_39/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6280974575432a38d9cf97942256e77af6e44f7d467c9097c9e9e988e0c5b48d +size 3743548 diff --git a/web-llm-models/v0_2_39/gemma-2b-it-q4f32_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/gemma-2b-it-q4f32_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..5521f4ee4af6ea77c0b7ee1c7acd4215ac2f2e65 --- /dev/null +++ b/web-llm-models/v0_2_39/gemma-2b-it-q4f32_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8abd52edfa27cc39ba44a28e4506a9bb86641cc88a8f62f02a520abce9fb917 +size 3681000 diff --git a/web-llm-models/v0_2_39/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..78aea05487e96326697ae68b8f8ca125806047fa --- /dev/null +++ b/web-llm-models/v0_2_39/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:079908afb27dafa5a08af2e7adb299dcd9609e4616fba19cc8c75bb1e7ea5fcf +size 3680994 diff --git a/web-llm-models/v0_2_39/gpt2-medium-q0f16-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/gpt2-medium-q0f16-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..f5b857fbe0c3e96879ae9c09e74dcbb47816cc78 --- /dev/null +++ b/web-llm-models/v0_2_39/gpt2-medium-q0f16-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77cdce72a601fa7d03afe614f2d9c770f70d8bc4a216d20f5c775ad1acfd4763 +size 4012678 diff --git a/web-llm-models/v0_2_39/gpt2-q0f16-ctx1k_cs1k-webgpu.wasm 
b/web-llm-models/v0_2_39/gpt2-q0f16-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..35797cd6efde476aaa49ecca9ae24176e24ff9e8 --- /dev/null +++ b/web-llm-models/v0_2_39/gpt2-q0f16-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72b3ac2a244d0744dbfac9c83af2bddcda9d61123244366541307fb19f4416ba +size 3645538 diff --git a/web-llm-models/v0_2_39/phi-1_5-q4f16_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/phi-1_5-q4f16_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..edcc2aa4a915f236d0814b40fcf5c6ece6801a16 --- /dev/null +++ b/web-llm-models/v0_2_39/phi-1_5-q4f16_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ddfac22614f2a05206c8bb07e4abc8239e6e4e4c52534abff105f69bcc6776f +size 4061199 diff --git a/web-llm-models/v0_2_39/phi-1_5-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/phi-1_5-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..44424852b9dda3cc2db81889ddac952eda0cc6eb --- /dev/null +++ b/web-llm-models/v0_2_39/phi-1_5-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f641f4c7e226760ade454f9207e15696187d24eb939e6ee5d8957adb07c6ce0c +size 4061195 diff --git a/web-llm-models/v0_2_39/phi-1_5-q4f32_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/phi-1_5-q4f32_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..68efe9cb47d11cfc654b1392d0231b9be50c2729 --- /dev/null +++ b/web-llm-models/v0_2_39/phi-1_5-q4f32_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2b89548a3d3a1991594f06fbb5af7171881983095e27963726803530bf35c8f +size 4043163 diff --git a/web-llm-models/v0_2_39/phi-1_5-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/phi-1_5-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 
100644 index 0000000000000000000000000000000000000000..8924fe1560b721ffa8cb0bcc1d3d3f51027ec209 --- /dev/null +++ b/web-llm-models/v0_2_39/phi-1_5-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70786f735a049ea5024f52381b1faa108d4bfa88d1318a3ab76a82a3b443e253 +size 4043138 diff --git a/web-llm-models/v0_2_39/phi-2-q4f16_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/phi-2-q4f16_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..45d5760e1ddb3857b02bde343cf6019a7866d586 --- /dev/null +++ b/web-llm-models/v0_2_39/phi-2-q4f16_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da245443a201217348d223f5b4cbb3c41e0da077e48c6605092c125f43fef7b1 +size 4207378 diff --git a/web-llm-models/v0_2_39/phi-2-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/phi-2-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..3d5a9dbd6a8ebcf99c991e5b60b996d0871abfcb --- /dev/null +++ b/web-llm-models/v0_2_39/phi-2-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1320c2c38cf9302fe93541bb7fff19bddaa0b5506533f46ad0864e32bd1cc38d +size 4207703 diff --git a/web-llm-models/v0_2_39/phi-2-q4f32_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/phi-2-q4f32_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..3afec40e9ae59c4248c53ab513b7a9b4006fd069 --- /dev/null +++ b/web-llm-models/v0_2_39/phi-2-q4f32_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:675c3adf80a0a9fa760155a66020a3aeb8d029de95e3a8fbc1b79ab14370a9cb +size 4202756 diff --git a/web-llm-models/v0_2_39/phi-2-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/phi-2-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 
0000000000000000000000000000000000000000..f13c1554ceec76933263c62e1e389238700d01ee --- /dev/null +++ b/web-llm-models/v0_2_39/phi-2-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cc13629294b96dae99aab75be5611a10b846ebb97e1b585e6cf6bcc5b24334c +size 4203079 diff --git a/web-llm-models/v0_2_39/stablelm-2-zephyr-1_6b-q4f16_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/stablelm-2-zephyr-1_6b-q4f16_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..8210ad44588256dea197a8921ce238ca6c0a8e6d --- /dev/null +++ b/web-llm-models/v0_2_39/stablelm-2-zephyr-1_6b-q4f16_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:160631a2152e8de062ccc4f528cc9847433b049c450c2798fafb79b835fb13e1 +size 4025121 diff --git a/web-llm-models/v0_2_39/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..169dc1cc9b2df3b665decc4f88ced3e44d89bcac --- /dev/null +++ b/web-llm-models/v0_2_39/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b046f6bbe45f900402ef8f2641f3cc3ec8abe0be1af64adb6c6ff7b3bbb0b225 +size 4025072 diff --git a/web-llm-models/v0_2_39/stablelm-2-zephyr-1_6b-q4f32_1-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_39/stablelm-2-zephyr-1_6b-q4f32_1-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b7ca0510d9ff912dbfa46817f8aeb3d9f718167e --- /dev/null +++ b/web-llm-models/v0_2_39/stablelm-2-zephyr-1_6b-q4f32_1-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a1c53b44c71fcb4ea3f04c39a75b70725a8965098f6b3da4e74b07c4e68552b +size 4005265 diff --git a/web-llm-models/v0_2_39/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm 
b/web-llm-models/v0_2_39/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..a36f78745bbb0577a9905f43574c312f8ec0734c --- /dev/null +++ b/web-llm-models/v0_2_39/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f6c5f5cb998832bc5d54eecec8b5823c85d418f4bb670eb703bb3f8fa62f703 +size 4005563 diff --git a/web-llm-models/v0_2_43/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..2e157dedef74024dc94f5234afdf0fbae9756555 --- /dev/null +++ b/web-llm-models/v0_2_43/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4f73bdd656106ae8c69dff9834937b45498ffd152f5f99e500b6711d1488076 +size 5433260 diff --git a/web-llm-models/v0_2_43/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..3b5a298b2e93576d177f7875c9543c1432575747 --- /dev/null +++ b/web-llm-models/v0_2_43/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b6c22c5d3d168df9a8c451e7275610c412fc36d25c0eab7d2b639e22c8af08f +size 5000506 diff --git a/web-llm-models/v0_2_43/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..5e2d70456b258847eb7ff756ab98ddcbb173f075 --- /dev/null +++ b/web-llm-models/v0_2_43/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e89c04a84dc7f69d16afc0806bc6b30df8662eec5337817bff8fbb473539b95f +size 4797480 diff --git 
a/web-llm-models/v0_2_43/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..a7552e8aee836eaea1182368e5f3ea0863b8dd81 --- /dev/null +++ b/web-llm-models/v0_2_43/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d0e03fd4e593f76a55d27505fa3e8eb2d203fc2763d2447d33039e17fdc197e +size 7452608 diff --git a/web-llm-models/v0_2_43/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..fa5ed5bc31c9a2d10a68bcfa047da44cc6b7b075 --- /dev/null +++ b/web-llm-models/v0_2_43/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bf8556eefc27861c59bfabb07695826a72d71a21ba86b921b56c83247814255 +size 5029165 diff --git a/web-llm-models/v0_2_43/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..2143620626aa19ff483dc4e1351fa6f229e8822e --- /dev/null +++ b/web-llm-models/v0_2_43/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9528f2cb0136ba8730a9e567a79525c238ee217b6b4ffdd905c739a36913a9f4 +size 4826023 diff --git a/web-llm-models/v0_2_43/Mistral-7B-Instruct-v0.3-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/Mistral-7B-Instruct-v0.3-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..9338cd7e0bcfec3f8448f1c64edb80d98c81e922 --- /dev/null +++ b/web-llm-models/v0_2_43/Mistral-7B-Instruct-v0.3-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:982b847843ce7f5cabf84b4290abbd71a0890755c73c600986a45450b1eac83c +size 4179314 diff --git a/web-llm-models/v0_2_43/Mistral-7B-Instruct-v0.3-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/Mistral-7B-Instruct-v0.3-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..1b48de5ad8dc47cf3e50bc7571d512098f9b9b27 --- /dev/null +++ b/web-llm-models/v0_2_43/Mistral-7B-Instruct-v0.3-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f256e2b9c9d9e091515fe690143be48ca1ee38cf76341ff0cecd66e0196e5176 +size 4060467 diff --git a/web-llm-models/v0_2_43/Phi-3-mini-4k-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/Phi-3-mini-4k-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..142a36d01211ff72190f463ee542532b6ef16b39 --- /dev/null +++ b/web-llm-models/v0_2_43/Phi-3-mini-4k-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c48357208644936cd4994c5940f745b0bf2b30ad3713047abc2281ff00d22a6e +size 4168003 diff --git a/web-llm-models/v0_2_43/Phi-3-mini-4k-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/Phi-3-mini-4k-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..991448bc101c24c8b55bda60ca2a3a98788c6c5f --- /dev/null +++ b/web-llm-models/v0_2_43/Phi-3-mini-4k-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa6f331b68e5aafad79fac9c4a8bf976b43ddc831b6a48db449adcfc1723ce27 +size 4073691 diff --git a/web-llm-models/v0_2_43/Qwen2-0.5B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/Qwen2-0.5B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..ff2a88b8d0a89fb8d417970f6dd9e354c37546ab --- /dev/null +++ 
b/web-llm-models/v0_2_43/Qwen2-0.5B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e104199bd87dbb7ecf6e5a0f8a01168e53ab9d24be0a097b4ee6419d2f952578 +size 3722336 diff --git a/web-llm-models/v0_2_43/Qwen2-0.5B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/Qwen2-0.5B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..53b6a254bf44adc1e5f82ff171dcc2861b9fbff1 --- /dev/null +++ b/web-llm-models/v0_2_43/Qwen2-0.5B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f074436e84a8c343143858d6dccb2bdf780b66e217a7a35f1f054506bc014707 +size 3694380 diff --git a/web-llm-models/v0_2_43/Qwen2-0.5B-Instruct-q4f16_1-ctx4k_cs2k-webgpu.wasm b/web-llm-models/v0_2_43/Qwen2-0.5B-Instruct-q4f16_1-ctx4k_cs2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..ea0db1e7bc9c11ffe08d96a8fe01eb01378f003d --- /dev/null +++ b/web-llm-models/v0_2_43/Qwen2-0.5B-Instruct-q4f16_1-ctx4k_cs2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:facd990bc4d0e06bbb41ab6cd559f15ec10f82b211e8b5ebfe5b10a09713b32a +size 3766468 diff --git a/web-llm-models/v0_2_43/Qwen2-1.5B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/Qwen2-1.5B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..c88a1b76f86ea6dcb01d7aab236599b0a91eeaab --- /dev/null +++ b/web-llm-models/v0_2_43/Qwen2-1.5B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff2f099e3555402934023b07fc88e87d473b08f4678b574d186ea8377ad20c9f +size 4090812 diff --git a/web-llm-models/v0_2_43/Qwen2-1.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/Qwen2-1.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 
0000000000000000000000000000000000000000..7d45b42ce6e0966068b09052415ff334f4f19a56 --- /dev/null +++ b/web-llm-models/v0_2_43/Qwen2-1.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfe8c30e6d9754d55da8e3abde20705188492878758a382e2e551d28b7d8ccf9 +size 3991708 diff --git a/web-llm-models/v0_2_43/Qwen2-7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/Qwen2-7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..143fd14e1dc96e8fe9ebae079d7499f87b48baf6 --- /dev/null +++ b/web-llm-models/v0_2_43/Qwen2-7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21eceea070aee09ecc7f7f689d289b6653718f876c55258e6745443f0be641cb +size 4201944 diff --git a/web-llm-models/v0_2_43/Qwen2-7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/Qwen2-7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..0b65e68efe3d16b2bf7d7c7b02e5c337e07a9d8f --- /dev/null +++ b/web-llm-models/v0_2_43/Qwen2-7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3a98db01ffb0595a5470a8f4fc3923c3633f117af781d689db75b872fc0567f +size 4094655 diff --git a/web-llm-models/v0_2_43/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..fd50c19c590022b52eb24b6bda00ced6fb79912b --- /dev/null +++ b/web-llm-models/v0_2_43/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10db6395572ca69eabe561e39c9842d3a70a342af9e28562c9953d91a7280096 +size 4447330 diff --git a/web-llm-models/v0_2_43/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k_cs1k-webgpu.wasm 
b/web-llm-models/v0_2_43/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..e056ae3fdcbb4b8d05cd888304d40eda55c2a35b --- /dev/null +++ b/web-llm-models/v0_2_43/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2009739c5af49b4440dcacc38a64eb50b4883230ab6154ced1702b78691429a +size 4427765 diff --git a/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..fe916c139d65e75676a1439df288cee52c4d5a09 --- /dev/null +++ b/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30565323af46790c9a03c95ba51d84ac2e57ba2f64653f020121b2b24c712e46 +size 4298066 diff --git a/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..38fb84831fdf1f0f38565054e5eb5646cad2fab2 --- /dev/null +++ b/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f50418833d5064017f6c4f3e09a59a6345fe39bcb8e3205acd62d8f6ae187316 +size 4169435 diff --git a/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..c8b04978d93e209aa18686ee851d2aecf09872ce --- /dev/null +++ b/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:eb079d893cc3be039470a8e04ebb72a14d0bf686d4753942e2238c405c72db01 +size 4519909 diff --git a/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..2d05041e41fa9ed1af69893a011c9f7f13872433 --- /dev/null +++ b/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af12b965f2541522b4b66082255e0a95fe74380f571f26a9ab42673ab01e375a +size 4376946 diff --git a/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v1.0-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v1.0-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..94b9554e0040b8983277828b620c4b18c9a58972 --- /dev/null +++ b/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v1.0-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b230809caa4d409850c073cf0b9ea7375d74739a01f68fd84fdfaee45b5a008 +size 4520205 diff --git a/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v1.0-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v1.0-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b7760437e99e2de8acf971601fb94ece37791c2c --- /dev/null +++ b/web-llm-models/v0_2_43/TinyLlama-1.1B-Chat-v1.0-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afcf801c5f3ef67e31af0c6389bd333edfbc0a7ed2b947a8b1de010378631f88 +size 4376940 diff --git a/web-llm-models/v0_2_43/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..e6319507177d319fc265284c374aafcacdebc609 --- /dev/null +++ 
b/web-llm-models/v0_2_43/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2276a231bedb9b1aa295b2581afab713dcaa83355b2a46a91fda8e1196bbb357 +size 3799920 diff --git a/web-llm-models/v0_2_43/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..8eef279b6b458410d4afb8f3b94dda06697e27af --- /dev/null +++ b/web-llm-models/v0_2_43/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6bdd1c529d7294afb8d4d99b305a08563ca46eae3bc6963bf0b434f9359a0bc +size 3735713 diff --git a/web-llm-models/v0_2_43/gpt2-medium-q0f16-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/gpt2-medium-q0f16-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b2c1c60fc238397a0909b4d6c585cdfcac0e1858 --- /dev/null +++ b/web-llm-models/v0_2_43/gpt2-medium-q0f16-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:869dfa6740d3d5481f8bd50828576a352dc6f3e8e0608eb9cb4b126457ac5449 +size 4074429 diff --git a/web-llm-models/v0_2_43/gpt2-q0f16-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/gpt2-q0f16-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..2ac60f05e64eb9d316abaaae3218c17b8e5eadd2 --- /dev/null +++ b/web-llm-models/v0_2_43/gpt2-q0f16-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b173b311d93b7f3b95a09bbc93bd266115ce3367354f05e442f42df83e9b897 +size 3709921 diff --git a/web-llm-models/v0_2_43/phi-1_5-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/phi-1_5-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..e4a264b0c5cee3adc3f82c93f0916e4912137ea9 --- /dev/null +++ b/web-llm-models/v0_2_43/phi-1_5-q4f16_1-ctx2k_cs1k-webgpu.wasm 
@@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:934d6c77f617f1773006e7bb6544f22dda60e7aee529f3a9c129da0bfa6d3c8d +size 4119980 diff --git a/web-llm-models/v0_2_43/phi-1_5-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/phi-1_5-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..5240b77dd9a1e068ed5d6aca3f1d4f404e991ea3 --- /dev/null +++ b/web-llm-models/v0_2_43/phi-1_5-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fae92f57acee4d845cbdf5926cf615fa973b8c3823673e8a5dc991fac3f62d7 +size 4097122 diff --git a/web-llm-models/v0_2_43/phi-2-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/phi-2-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..7cab39cf983d4803013386ee87b417fe9a24f161 --- /dev/null +++ b/web-llm-models/v0_2_43/phi-2-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfc3c73c0ad08958047cd024eed5544b96f94d2e84c75578abd718cacfca6c8a +size 4262392 diff --git a/web-llm-models/v0_2_43/phi-2-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/phi-2-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..c5c52a80bd8eac4e10475ed42b01fc74457f16ae --- /dev/null +++ b/web-llm-models/v0_2_43/phi-2-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60090bd9a42c43756c837004dcc73123a3b0c6c5f05c28226879b66338943aef +size 4257306 diff --git a/web-llm-models/v0_2_43/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..7bf929dafb3d48b5f38021b747cf7eccbada1fa2 --- /dev/null +++ b/web-llm-models/v0_2_43/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:065afb2675a1eb68a96dfbe9aed95f2b3f1f3b1930120d6602a6c1d95929a4e3 +size 4082420 diff --git a/web-llm-models/v0_2_43/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_43/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..be3b08fce1e9a61384567f0771377c71b3a06b43 --- /dev/null +++ b/web-llm-models/v0_2_43/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53c91bf4ea2a515d91baea4802801038406e26df95dd25b93ca63d7652274a22 +size 4058029 diff --git a/web-llm-models/v0_2_48/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..0e7677063c8c2d7b2a5f2aa7f84c27fcf4ecc68f --- /dev/null +++ b/web-llm-models/v0_2_48/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bb93acfaf8c516f157d3e4cd76c7988adf08ed4a5940c9216dd37685d1ba3df +size 5441125 diff --git a/web-llm-models/v0_2_48/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..6a7ad410ca6240763a5a32c894f6f25710792330 --- /dev/null +++ b/web-llm-models/v0_2_48/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:701f90b65725ca5a25005b23110b2d670a5af4fb0668b1953d59943eee3b3159 +size 5008373 diff --git a/web-llm-models/v0_2_48/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..2db4091525e45ab86a866fe1f87e22b1c0934d33 --- /dev/null +++ 
b/web-llm-models/v0_2_48/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2136f456421e1ec8cafa9a38e80e62a74103c2d10fb818b3cfa845b227fa1bf +size 4805049 diff --git a/web-llm-models/v0_2_48/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..de32ede2f6ae15b0b145014443738ba4071f7e5c --- /dev/null +++ b/web-llm-models/v0_2_48/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b56d3b8384cff894e5408adb71a0805b3ae51d8688165c59981f1b8d8abb0418 +size 7460475 diff --git a/web-llm-models/v0_2_48/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..4802231a6c60b1743f80a80c5a25da5285d82f91 --- /dev/null +++ b/web-llm-models/v0_2_48/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a00ac2128e3dec5f501fe2b131c69b5ced92a7bf032775032ef838a7fffd6f87 +size 5037019 diff --git a/web-llm-models/v0_2_48/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..95ad266d2b265ac41c37cf7018c1d735937e1657 --- /dev/null +++ b/web-llm-models/v0_2_48/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0a8dce5a5683ccdae8d9c0d6026b0ae7fc4c9bff67dc6010dfcb9a2f1e97214 +size 4833893 diff --git a/web-llm-models/v0_2_48/Llama-3.2-1B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Llama-3.2-1B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 
0000000000000000000000000000000000000000..bd8e51f8262a97bb46e8a7367c7b07194b76cf37 --- /dev/null +++ b/web-llm-models/v0_2_48/Llama-3.2-1B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f139463d99dce9a31360d21915a887a3fa7d1db7ea4430d3e59bd7a6ddce77b7 +size 4113319 diff --git a/web-llm-models/v0_2_48/Llama-3.2-1B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Llama-3.2-1B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..1e0df284c0459cbdcae9b53e6f976b9cba9f6faa --- /dev/null +++ b/web-llm-models/v0_2_48/Llama-3.2-1B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a02bf49702dd2347de4637f5a31a295c9aa557cb90583302942bf5ce0405a0a +size 4027038 diff --git a/web-llm-models/v0_2_48/Llama-3.2-1B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Llama-3.2-1B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..a551668712ee27239b35443a6e3b7a12cb5624e9 --- /dev/null +++ b/web-llm-models/v0_2_48/Llama-3.2-1B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c576c81b33d192cf3038a32bca13bb086d8eb87b25ed9e38b8918ea54041e710 +size 4350548 diff --git a/web-llm-models/v0_2_48/Llama-3.2-1B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Llama-3.2-1B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..7367df55f3281c9636a7c68779b5d8efdeb81435 --- /dev/null +++ b/web-llm-models/v0_2_48/Llama-3.2-1B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:867d98edf5d5880b1ff6f1492c96fa606c633942caf08ad355bc372cf9dc02d0 +size 4239396 diff --git a/web-llm-models/v0_2_48/Llama-3.2-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm 
b/web-llm-models/v0_2_48/Llama-3.2-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..bea37032848b5e8974d5466354082b1d499f6583 --- /dev/null +++ b/web-llm-models/v0_2_48/Llama-3.2-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e43933ad8a5783b1eb8d731ef891b266d37ad2e1f6a1fec1152e6a2c631d3d9 +size 4974252 diff --git a/web-llm-models/v0_2_48/Llama-3.2-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Llama-3.2-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..f4ab22ec8ab151a20bb308830bba42138a21cbad --- /dev/null +++ b/web-llm-models/v0_2_48/Llama-3.2-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ffd88ce56137ba59e9a280588652915edb2c699e3ad8e281afb8e7407b7181c +size 4797890 diff --git a/web-llm-models/v0_2_48/Llama-3_1-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Llama-3_1-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..a7b77854ab2a7ed5a6d1bde55fc5e3d7701e957b --- /dev/null +++ b/web-llm-models/v0_2_48/Llama-3_1-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7d3817ce3bed09849d41505c4d29155dedd00f1fd90202c67fa5b2e60245e5c +size 7566203 diff --git a/web-llm-models/v0_2_48/Llama-3_1-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Llama-3_1-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..983cc50f3bf3523bb56397461210c3301b1e7c47 --- /dev/null +++ b/web-llm-models/v0_2_48/Llama-3_1-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7bc08f187d6c7499a0b73cb50a5e87196274f1db20c00d20dcd23860d8d9c62 
+size 5142829 diff --git a/web-llm-models/v0_2_48/Llama-3_1-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Llama-3_1-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..6051a10c3d81498d1592b8b16ac052556c4415c8 --- /dev/null +++ b/web-llm-models/v0_2_48/Llama-3_1-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bcdaa523ecd5947b2bb3979616b1cdd7d8bd778b39dc31adf4b128605a41e0e +size 4889941 diff --git a/web-llm-models/v0_2_48/Mistral-7B-Instruct-v0.3-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Mistral-7B-Instruct-v0.3-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..f265b4b47dc18e007a6c706b313b9c1322bdbb04 --- /dev/null +++ b/web-llm-models/v0_2_48/Mistral-7B-Instruct-v0.3-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20c522a069b373aa9335fb1d8ba2205f3186abfcf73b95f92f2e99006ca2ea9d +size 4187185 diff --git a/web-llm-models/v0_2_48/Mistral-7B-Instruct-v0.3-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Mistral-7B-Instruct-v0.3-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..65b79311c25c694df9692a6fe8e45fe6c4b3448b --- /dev/null +++ b/web-llm-models/v0_2_48/Mistral-7B-Instruct-v0.3-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf061a1473d92056c6879f45da64781ece61999724f0f1f98942ead72e0cd62d +size 4068337 diff --git a/web-llm-models/v0_2_48/Phi-3-mini-4k-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Phi-3-mini-4k-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..dcd1e902ab5e24fdc5b0b7dcec75755afcebb417 --- /dev/null +++ b/web-llm-models/v0_2_48/Phi-3-mini-4k-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:c577bcdffd91f95c758a348d1c489bdcf5bd4e6982e7dcdafec86e778e430517 +size 4175678 diff --git a/web-llm-models/v0_2_48/Phi-3-mini-4k-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Phi-3-mini-4k-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..c4a0bc964df5ffe4f3f10c4ee2a96a943b9c9db5 --- /dev/null +++ b/web-llm-models/v0_2_48/Phi-3-mini-4k-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1483e5aa8ab555c9706481619a1189f65929a839277bf345bc16d3cce809d92 +size 4082170 diff --git a/web-llm-models/v0_2_48/Phi-3.5-mini-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Phi-3.5-mini-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..dc4803a04f1c97328d39a4ea8bad6019dfd5e1da --- /dev/null +++ b/web-llm-models/v0_2_48/Phi-3.5-mini-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a2bf991d39b1de9e33cd1edbaee60093e5233036a20c01732e5c61e740912cc +size 4238667 diff --git a/web-llm-models/v0_2_48/Phi-3.5-mini-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Phi-3.5-mini-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..3451b87bbb41b3f7adb018fc6d137e4a86db1b65 --- /dev/null +++ b/web-llm-models/v0_2_48/Phi-3.5-mini-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf4349108e76e901035d34dfcc54e523c6d31f687f8b991e076d521a24178383 +size 4145804 diff --git a/web-llm-models/v0_2_48/Phi-3.5-vision-instruct-q4f16_1-ctx4k_cs2k-webgpu.wasm b/web-llm-models/v0_2_48/Phi-3.5-vision-instruct-q4f16_1-ctx4k_cs2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..5ee152e33724924f07513f8c4165aab18c087179 --- 
/dev/null +++ b/web-llm-models/v0_2_48/Phi-3.5-vision-instruct-q4f16_1-ctx4k_cs2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a690a71fc4fec54a44374f6c11eeeb1e819a2a7989e5fd7297d7e5f8e79375b2 +size 7207325 diff --git a/web-llm-models/v0_2_48/Phi-3.5-vision-instruct-q4f32_1-ctx4k_cs2k-webgpu.wasm b/web-llm-models/v0_2_48/Phi-3.5-vision-instruct-q4f32_1-ctx4k_cs2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..c6a89c5d07f667cf74b76ad8f6cba3e0af8671be --- /dev/null +++ b/web-llm-models/v0_2_48/Phi-3.5-vision-instruct-q4f32_1-ctx4k_cs2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1066927a58ed0a62eb599375fd5efb28a501edcbba2f30eac8c3ff298c0afcea +size 7103355 diff --git a/web-llm-models/v0_2_48/Phi-4-mini-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Phi-4-mini-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..e531b275461e097724693814a07e4639e14355b1 --- /dev/null +++ b/web-llm-models/v0_2_48/Phi-4-mini-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aca842b5179177641deb1ed06e820f32e1c48ac51642c746e3be129dd498dcd0 +size 4215096 diff --git a/web-llm-models/v0_2_48/Phi-4-mini-instruct-q4f16_1-webgpu.wasm b/web-llm-models/v0_2_48/Phi-4-mini-instruct-q4f16_1-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..20119a3c6a73d405ed3ca9e4d239f108d5f29fc6 --- /dev/null +++ b/web-llm-models/v0_2_48/Phi-4-mini-instruct-q4f16_1-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cb51f1415b06b04bd556f48e617f0df24e33e07b28a55a279983275307fd0e1 +size 4279042 diff --git a/web-llm-models/v0_2_48/Phi-4-mini-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Phi-4-mini-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 
0000000000000000000000000000000000000000..3b676f5449ebb3c4fc594f29a2919e41cdaf19f5 --- /dev/null +++ b/web-llm-models/v0_2_48/Phi-4-mini-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68c7c625ef5fa1d13db0d92ad47791936088d7ddc7432c585bf0dfe7a34b5dd9 +size 4078906 diff --git a/web-llm-models/v0_2_48/Qwen2-0.5B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen2-0.5B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..8286ebf2703959b75e913463cbebb7b24cff5238 --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen2-0.5B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2d260f011e86ac62ed6ea254912e521ebccb341e030a3fea26fd1de5c535661 +size 3730173 diff --git a/web-llm-models/v0_2_48/Qwen2-0.5B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen2-0.5B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..378946d9542943452922e9a08e67b15b243c012a --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen2-0.5B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21b4c0c5c65fdd847ab16b1cad27f4bab15b30f0fbcc4bd69fb6ba19ff5f14c6 +size 3702215 diff --git a/web-llm-models/v0_2_48/Qwen2-0.5B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen2-0.5B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..101a7da4769ab33a0e2381fdda33f06f31d4d4b8 --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen2-0.5B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeef8ad5c1e668b066a3edc2e7f5d48e78d0749c869d87c00270406d95537c63 +size 3762958 diff --git a/web-llm-models/v0_2_48/Qwen2-0.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm 
b/web-llm-models/v0_2_48/Qwen2-0.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..a92ec2e5f9dc0ad513f6d377edaf097361031903 --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen2-0.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:338ab000a62274cb47fa0696aa244d4b1d73db4e6f144b429915d1cfe44d2e6a +size 3735773 diff --git a/web-llm-models/v0_2_48/Qwen2-1.5B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen2-1.5B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..a86ae36b998bfbca04af6d925bb2a68d1a92b0a9 --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen2-1.5B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14ef8ff95b20cc099df70d365babd18dc8023936eeacc2f459bac21e0a4f9dfa +size 4098672 diff --git a/web-llm-models/v0_2_48/Qwen2-1.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen2-1.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..0095e6bd240d895c9c692ab0825210de71827635 --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen2-1.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75113c4eda9b941f853180dce38911311b0ba9053ab54e0d3f38ccc4b765a8ac +size 3999571 diff --git a/web-llm-models/v0_2_48/Qwen2-7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen2-7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..a4a37cd1d377400b3afdfbf356b97f73fd31c6a8 --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen2-7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d4d494a8a50937491cc789d77fe3fcf0859dd8005cbf5603cc6c1a8efcc6227 +size 4210172 diff --git 
a/web-llm-models/v0_2_48/Qwen2-7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen2-7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..7ccb2f4ed8cb9a9ccad10731390aec7380a1b67a --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen2-7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc0c834c52878c4a0821c3eda2a87e37cad61329f3cbef8cc47a76936bc8e2d1 +size 4102190 diff --git a/web-llm-models/v0_2_48/Qwen2.5-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen2.5-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..4f1300e0868fd5d2a04fc881cffb57ec1c1ae3f5 --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen2.5-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e03e730253a84b6d8f375ebcff7ffd194fe9633aff4380c34ccbf53c626877e +size 4428606 diff --git a/web-llm-models/v0_2_48/Qwen2.5-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen2.5-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..be21653c53d7656025c3a4fb6d60b88420d12698 --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen2.5-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:964c02308ab453460c20e79c90925d8637e3121a4cd916b3fdc384f8821ca019 +size 4313172 diff --git a/web-llm-models/v0_2_48/Qwen3-0.6B-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen3-0.6B-q0f16-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b9da02e5095c5c9583ba30bb49b02cf49e34fd6d --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen3-0.6B-q0f16-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:14f4ddc2df0e72d40258597403076c15ce6af4b8d2eb2ec38f6bbde7196589d1 +size 4516014 diff --git a/web-llm-models/v0_2_48/Qwen3-0.6B-q0f32-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen3-0.6B-q0f32-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b10534a663509f52ce607b95a93ec5c4f9a8bc4c --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen3-0.6B-q0f32-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c55af838bf26f22733fc7ea13d3e40c096e2c22e8eb8ef46fe4641f2a0578961 +size 4423618 diff --git a/web-llm-models/v0_2_48/Qwen3-0.6B-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen3-0.6B-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..ca342926d915db652a5f8221acc9e79ecea7a981 --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen3-0.6B-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ecd8d800f8f1e3a95c3e9d63595c04458eae3d494c20b48fccee5d32019aa46 +size 4709480 diff --git a/web-llm-models/v0_2_48/Qwen3-0.6B-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen3-0.6B-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..eda31ceda34d75eb0a7cc8a72f61fafba387693c --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen3-0.6B-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5053de74239ecc27d47fce0e8ec6fe53b8424570546c4558b2bf670570660638 +size 4593277 diff --git a/web-llm-models/v0_2_48/Qwen3-1.7B-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen3-1.7B-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..1626d7d61f24df6a92d597ae01d39f05ab6ece90 --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen3-1.7B-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:6407437acec628497086916f43ba7d796a73c0b2fa4777060e9899e6d8ffb0fb +size 4740005 diff --git a/web-llm-models/v0_2_48/Qwen3-1.7B-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen3-1.7B-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..35efef01de960d86d076d00389c5768b7c0f5c7d --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen3-1.7B-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a791bd73fd6f13e8b277f24ba934dcd273c8171f0f100a5ea468acf1ff2e9bbe +size 4618837 diff --git a/web-llm-models/v0_2_48/Qwen3-4B-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen3-4B-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..57136337c2fa77943e96a63928b049d3b083ddb5 --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen3-4B-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71ce32a8169dc562b07c0dbba3bef5bc5bd114f32c7802ebf3abb3f89955b401 +size 5025851 diff --git a/web-llm-models/v0_2_48/Qwen3-4B-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen3-4B-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..0817c26c29e706fe6fe77b1782bc423e544e5c91 --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen3-4B-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f956f37115fab63cd6020b14f2f113e1d94824541a5baecd25d45aaecb76e7aa +size 4882411 diff --git a/web-llm-models/v0_2_48/Qwen3-8B-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen3-8B-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..781a60f5b9671e88091068fe4e870e361974eaf0 --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen3-8B-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:6bfc549989b3beb2863cf3b97e0030c635c10518aebf3e27ff172dea0f06d8bd +size 5035160 diff --git a/web-llm-models/v0_2_48/Qwen3-8B-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/Qwen3-8B-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..98d4adfd7ea84640dc0c9fbde74dc93c8eacbe71 --- /dev/null +++ b/web-llm-models/v0_2_48/Qwen3-8B-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07c1c161b0741da8e4c70d15b7aea48d2ae246782c02cc430f74b900dc46abac +size 4886006 diff --git a/web-llm-models/v0_2_48/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..a5207c99ba20e8ea4c933d11bd545ab638d1d7e0 --- /dev/null +++ b/web-llm-models/v0_2_48/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b3c9fdb9826d82d54375fe684e63413a79273d888ec39e99768fd983306d078 +size 4455772 diff --git a/web-llm-models/v0_2_48/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..01bf90e85823e8126e90ea4efb7c0359e8cac899 --- /dev/null +++ b/web-llm-models/v0_2_48/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b31550aa58367413c5806bdaf0591f90389b178f23f48b923d261378e2a36685 +size 4435507 diff --git a/web-llm-models/v0_2_48/SmolLM-1.7B-Instruct-q0f16-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM-1.7B-Instruct-q0f16-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..22281b5fa6f75552e06a5895da5ad0ce284d7648 --- /dev/null +++ 
b/web-llm-models/v0_2_48/SmolLM-1.7B-Instruct-q0f16-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae1cbffc3d17fad2e9113898675442af4ce0390fb63247eb4aa93172698705c8 +size 4379038 diff --git a/web-llm-models/v0_2_48/SmolLM-1.7B-Instruct-q0f32-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM-1.7B-Instruct-q0f32-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..49473fa9e5a8433ebb073a6c0d364c98e72af13d --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM-1.7B-Instruct-q0f32-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74c7b902895d99b7c62ebd26f92aef25bdad11536976221eecbeb9d42fda0ffe +size 4249278 diff --git a/web-llm-models/v0_2_48/SmolLM-1.7B-Instruct-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM-1.7B-Instruct-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..f8ea4a2e55373da58e58dd5552132c83c946f6fa --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM-1.7B-Instruct-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fef2375047e0020f90e652f455a8a618e8ac1942fbe7c5e1914681fc2bb6850 +size 4613108 diff --git a/web-llm-models/v0_2_48/SmolLM-1.7B-Instruct-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM-1.7B-Instruct-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..7ae7c4663e8e87fa081deb047a0cfcad1a85e5f7 --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM-1.7B-Instruct-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2995805ba4ba10421ca6c961bbafad6de1a8687cf1777a02bdd4cc98ae87951e +size 4459583 diff --git a/web-llm-models/v0_2_48/SmolLM-135M-Instruct-q0f16-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM-135M-Instruct-q0f16-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 
0000000000000000000000000000000000000000..1b33b337f2852ffd7f44bbe2f5c6fa462b92f8f7 --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM-135M-Instruct-q0f16-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4b78e92a25407b194b60634bef93349f33a9f09e3a7b6b9bddb873d2a79e90c +size 4345157 diff --git a/web-llm-models/v0_2_48/SmolLM-135M-Instruct-q0f32-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM-135M-Instruct-q0f32-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..f7a1cef5f764841a9d1108845876e2aed935362d --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM-135M-Instruct-q0f32-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33cd470d240deafe7639d56346787fd1ee49fef3ffdd2f272e00edc8622055c2 +size 4317628 diff --git a/web-llm-models/v0_2_48/SmolLM-135M-Instruct-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM-135M-Instruct-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..08a659988e831ff2da7eaadb1b101ffc52b5a9c8 --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM-135M-Instruct-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd963f4c115dcec0cc1ae076740b218641cb4a75d7b18d20dd588ed0a01db259 +size 4619105 diff --git a/web-llm-models/v0_2_48/SmolLM-135M-Instruct-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM-135M-Instruct-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..c51dba6cb4b090b22ded778a75d2ac4297e3a64c --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM-135M-Instruct-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d62c0701faa7dde70fc205a03a9087fb3b4a07344e6b9c2d29c0e7670ebb8e6c +size 4591518 diff --git a/web-llm-models/v0_2_48/SmolLM-360M-Instruct-q0f16-ctx2k_cs1k-webgpu.wasm 
b/web-llm-models/v0_2_48/SmolLM-360M-Instruct-q0f16-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..28eb7d97959973c2a2007373e68d93d4f0068fef --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM-360M-Instruct-q0f16-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4315756c2b7410187a0fa9dc9de5ae101ee171dce93fb4e8e4609989795b673 +size 4466304 diff --git a/web-llm-models/v0_2_48/SmolLM-360M-Instruct-q0f32-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM-360M-Instruct-q0f32-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b504082538d29fc0be3040b344f0bb083f88af41 --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM-360M-Instruct-q0f32-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:238728e370c37e809644925435d5aed52d27268fb27891f30d7a7cdd89c12289 +size 4438025 diff --git a/web-llm-models/v0_2_48/SmolLM-360M-Instruct-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM-360M-Instruct-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..30cb7fce3d64958622bb83427fd5404029b5f514 --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM-360M-Instruct-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8c1d03509f73cd33543ea0f12f564af352de6b2df34ec9fce55bd3fcb121df9 +size 4658316 diff --git a/web-llm-models/v0_2_48/SmolLM-360M-Instruct-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM-360M-Instruct-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..0fa4c6107d7514939f4a7abcb50ae235bc9a28d6 --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM-360M-Instruct-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:237b745f96fabd8b159c7e7cdf202c1b86aade21d7facd35c86e700ba25017b8 +size 4630288 diff --git 
a/web-llm-models/v0_2_48/SmolLM2-1.7B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM2-1.7B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b0723969213cf5ffd2125b76da108154d81f4ebb --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM2-1.7B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72460f1d7a974d126bce8ccea5116653c7a0aea0d44c4da1560a8686aedf57f1 +size 4431160 diff --git a/web-llm-models/v0_2_48/SmolLM2-1.7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM2-1.7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..984313c30f7f3e3928d32f85864c85b90f5b0a15 --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM2-1.7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:221370b0e9091aa2aeea45aac661871159aa6c572376f1f37ea270bb2899aea9 +size 4718828 diff --git a/web-llm-models/v0_2_48/SmolLM2-1.7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM2-1.7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..81819fd074249dea14514897025bd236ce6653c3 --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM2-1.7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b66a8c65afc65b99b66653f5138191dbb4a52052f15c1cdb2fb55893c3539b36 +size 4569717 diff --git a/web-llm-models/v0_2_48/SmolLM2-135M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM2-135M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..f93c318fdbfd13820c56b17ed6aa25fc5da33309 --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM2-135M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:b16229b248a58207977adac68d3ad680d8cfa1cb481d79dc1ed319df82a6650b +size 4401699 diff --git a/web-llm-models/v0_2_48/SmolLM2-135M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM2-135M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..17c0d1b01b2295dda6ff3cd7fdf2df718adb2586 --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM2-135M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:291ae8f3bc2823604628a5261fb43ce76e6fc9438d0b0b8cbc6659826e18ba53 +size 4377060 diff --git a/web-llm-models/v0_2_48/SmolLM2-135M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM2-135M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..43b6a374feb387a875e6eb6ea39ae35945ffe4ef --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM2-135M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be09a5c94403a49e6e37b65c13797279bdf85bf2ade1c418fc3536ae0d576ef6 +size 4719758 diff --git a/web-llm-models/v0_2_48/SmolLM2-135M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM2-135M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..3147012f9288253a5b39b907f8d6a435e1cb3797 --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM2-135M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab725c5700355948048e9f4455f4c6f01e693d587c56bd3f9350afba15d17368 +size 4695234 diff --git a/web-llm-models/v0_2_48/SmolLM2-360M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM2-360M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..97db6dd058c9dda885419045b6b30e37bdebf78b --- /dev/null +++ 
b/web-llm-models/v0_2_48/SmolLM2-360M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1fac5a6d187c2693559295aeab8ca569bc08af5d476088c0a85c394aa98aa1b +size 4523147 diff --git a/web-llm-models/v0_2_48/SmolLM2-360M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM2-360M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b2ba637eab48eda41b7ed3d3f0211cf06bd66e0f --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM2-360M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d9b4583777d5d2d1966b9feb8887395f735bbecf09f6623d7a8d6bdbd9ea239 +size 4497934 diff --git a/web-llm-models/v0_2_48/SmolLM2-360M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM2-360M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..eca8a4df7f007c66fde73c4f767a5ae24429ea6e --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM2-360M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f8e5ab8fed5a087e42b25a6301f30d5ed1336ba668d6325e528f83bd7cf2bbb +size 4753674 diff --git a/web-llm-models/v0_2_48/SmolLM2-360M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/SmolLM2-360M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..250cf0d61d4ccc94748d70dad0bee936511a2859 --- /dev/null +++ b/web-llm-models/v0_2_48/SmolLM2-360M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9488bc675d83d38604c6f289c0c6b813b827d6882455406cd355f2212036dba5 +size 4728519 diff --git a/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 
0000000000000000000000000000000000000000..abeb73e6859b09626e1900b2f9037fd63310fcc1 --- /dev/null +++ b/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faec533c564b081b8271f0e58f4e0c3bc327f1e1859f730cee0572f63808d1c1 +size 4306031 diff --git a/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..cb6e4a9c08eca66d2517fadeb98f71278aa50b1c --- /dev/null +++ b/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc767708eee8eb765b06f1fc359e3e13021f1b8259ca8d4d07832974f7943c16 +size 4176989 diff --git a/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..c76020a27f7202ee45d37c8d86a7ea6b20fd73c8 --- /dev/null +++ b/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ff2f1a3f5be8f387017c739fd5835ab043b38047d93b6b15c34c7cc4709ed05 +size 4528017 diff --git a/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..ebe4740a971c6646c24fa2dd4148b2eed16351cf --- /dev/null +++ b/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b682324a61d4d41ca4be06978c7b8b414c7176adb9d80d555a778a87cd6e4209 +size 4384748 diff --git 
a/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v1.0-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v1.0-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..70cb7e255d74c7df2df970560c6e7668bea31c5b --- /dev/null +++ b/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v1.0-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8da8b23bcf2a99fef8769c5f4d3765c03f22cf035e36b266b367a1ed88913e +size 4528009 diff --git a/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v1.0-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v1.0-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..7f51448d690ab86e4355c4d874d17cf901555327 --- /dev/null +++ b/web-llm-models/v0_2_48/TinyLlama-1.1B-Chat-v1.0-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df67bf715977bd371cfcb9779692a7b58362c4756be83551729a5cfdf7622b1a +size 4384696 diff --git a/web-llm-models/v0_2_48/gemma-2-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/gemma-2-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..72d996e90248ec78dadfbd068ec266a0af808074 --- /dev/null +++ b/web-llm-models/v0_2_48/gemma-2-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c0ce8675d1dc022e1ed274e2201c5e652f470d29dee8b9dc1eb4a3f4e42739e +size 4101995 diff --git a/web-llm-models/v0_2_48/gemma-2-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/gemma-2-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..9c32d18492379e291eb62a3d2fece41e9bcd3d4e --- /dev/null +++ b/web-llm-models/v0_2_48/gemma-2-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:65064001a0018490fb82a4bba4e21771983c467680591f1f3303d8183c1ab648 +size 4079370 diff --git a/web-llm-models/v0_2_48/gemma-2-2b-jpn-it-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/gemma-2-2b-jpn-it-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..1979434f5e870bdaf1e781d4726f3c4ff3e59e73 --- /dev/null +++ b/web-llm-models/v0_2_48/gemma-2-2b-jpn-it-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a107fe91ca846a23c0784ce70e257995807b885ef0a9eee189222c233c54dc1 +size 4217336 diff --git a/web-llm-models/v0_2_48/gemma-2-2b-jpn-it-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/gemma-2-2b-jpn-it-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..84e0871877c5d6b6712d6bc4de71cd9df48f875e --- /dev/null +++ b/web-llm-models/v0_2_48/gemma-2-2b-jpn-it-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:313ced053382440f5fcd4e370fdd65b3274162b8b588ed22e8c5427f8f0ba362 +size 4191329 diff --git a/web-llm-models/v0_2_48/gemma-2-9b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/gemma-2-9b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..5bd2db88b0bf960be3c03d6178c9ae8ba4d967b5 --- /dev/null +++ b/web-llm-models/v0_2_48/gemma-2-9b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de1633844c715a01d75c62ef6bb2f8163c8b679a50a30d5830acec32748fc0d2 +size 4648656 diff --git a/web-llm-models/v0_2_48/gemma-2-9b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/gemma-2-9b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..1084816855a5915f30490ec0e465bd0ca76a7ea9 --- /dev/null +++ b/web-llm-models/v0_2_48/gemma-2-9b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:d8875aec7c1928b39f857be344ec99604f873226d835ad7b266d58241b57633f +size 4607551 diff --git a/web-llm-models/v0_2_48/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..88f0b94555092b33109593dff2d6fc0358b73b7a --- /dev/null +++ b/web-llm-models/v0_2_48/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b2d2b7ee77a838d012138fd8d0bdccdc44780f88557deba15455a832a2dd193 +size 3807774 diff --git a/web-llm-models/v0_2_48/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..effb751eb977e01fed9a0a64ace1dd5c1ab5c344 --- /dev/null +++ b/web-llm-models/v0_2_48/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5bb97a54051e17d3a11f266767f022c2893d60cf5a3fba8227939cbab0c0cec +size 3743577 diff --git a/web-llm-models/v0_2_48/gpt2-medium-q0f16-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/gpt2-medium-q0f16-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..340f9249a205bb77cff76f3fbe29d8d5a1317e9a --- /dev/null +++ b/web-llm-models/v0_2_48/gpt2-medium-q0f16-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8b6ab20d81f26b8ef87f50f3e1290fa61c0197a0cc07489363832317418df29 +size 4082248 diff --git a/web-llm-models/v0_2_48/gpt2-q0f16-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/gpt2-q0f16-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..8d344aaedc15491b3d7b6031829c02108eac3435 --- /dev/null +++ b/web-llm-models/v0_2_48/gpt2-q0f16-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:064b48f8adcf2368cbe30c07d3f21e74f1007445c5d4010c975ab9c47610cfaa +size 3717730 diff --git a/web-llm-models/v0_2_48/phi-1_5-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/phi-1_5-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..0cc51d1a5d799ce06dc0454d9e1400c02c70701f --- /dev/null +++ b/web-llm-models/v0_2_48/phi-1_5-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f84ae8f29eb9a589ee73fccf64955d474289e9c880d7ec134584479742d6722 +size 4127547 diff --git a/web-llm-models/v0_2_48/phi-1_5-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/phi-1_5-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..5d0f994c296c8faf871cde1598f5d36b25545894 --- /dev/null +++ b/web-llm-models/v0_2_48/phi-1_5-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20eb892c4ce98d666db98f1c61812f7120101529fc8b685b87758fc1fddcb64 +size 4104933 diff --git a/web-llm-models/v0_2_48/phi-2-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/phi-2-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..8566471d66cb0489cc9ac6704159665825456a96 --- /dev/null +++ b/web-llm-models/v0_2_48/phi-2-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f218e1ba54cc01e9a6ee2aea9f26759d72c5cc841f73f51e8eb3cc6f48aa1e27 +size 4270177 diff --git a/web-llm-models/v0_2_48/phi-2-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/phi-2-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..16ce90ebe2821e0926080c27ec6e9e10e582bfa0 --- /dev/null +++ b/web-llm-models/v0_2_48/phi-2-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70df36d6824f4c9d4bf4e477978d938b597ce510667fe01452e018105f28eb01 +size 
4265668 diff --git a/web-llm-models/v0_2_48/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch32-webgpu.wasm b/web-llm-models/v0_2_48/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch32-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..34e3d603c169abb4887509303276e5ae230f3243 --- /dev/null +++ b/web-llm-models/v0_2_48/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch32-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:610044ad036a542fe8e8bd71bf4171b145ef10689f4e1c4acb01c3e215fe517c +size 2995385 diff --git a/web-llm-models/v0_2_48/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch4-webgpu.wasm b/web-llm-models/v0_2_48/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch4-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..ff8c5c0b9f06476b6ad78088a218a9eb0e02239b --- /dev/null +++ b/web-llm-models/v0_2_48/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch4-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ad787fe6a88dc354698be0e4a73d43d860d635aed5695a6b84fee850dc5e7f9 +size 2995379 diff --git a/web-llm-models/v0_2_48/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch32-webgpu.wasm b/web-llm-models/v0_2_48/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch32-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..6730310e77b4564db2eaea29a7f7610580bd6d16 --- /dev/null +++ b/web-llm-models/v0_2_48/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch32-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfe2353fe51bca4e775b47fba37aec86d08e0081b23a24e5bde18ff84f0e6b31 +size 2967692 diff --git a/web-llm-models/v0_2_48/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch4-webgpu.wasm b/web-llm-models/v0_2_48/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch4-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..11870a68edf99ddf973b27caa0a915134c110aa4 --- /dev/null +++ 
b/web-llm-models/v0_2_48/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch4-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:480ea71b15f985a7800e21709d247070b349aa0ba0880c42b9535b859ce19ca1 +size 2967695 diff --git a/web-llm-models/v0_2_48/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..50d092143ae30f6a414b1d3adfa9bc2dc805fafe --- /dev/null +++ b/web-llm-models/v0_2_48/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f9f7172eaba12e033bb4efa15620a79c4993580e531ea47f83b72fecde00e11 +size 4090533 diff --git a/web-llm-models/v0_2_48/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_48/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..aa47699b9307f7bb47fa7b9de83a1dae3f276e6e --- /dev/null +++ b/web-llm-models/v0_2_48/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ed290952632dfa46aef774cf0217dbf6e5ed5e023c8ed65704284c1787b90b0 +size 4065854 diff --git a/web-llm-models/v0_2_80/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..de9303f766f4e42e13902d5d130a35eb3ac132d2 --- /dev/null +++ b/web-llm-models/v0_2_80/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b4219693562cc5a3a198e017b83cb1e37a93c61529f925b1abd763566db28e5 +size 5867642 diff --git a/web-llm-models/v0_2_80/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 
0000000000000000000000000000000000000000..ed0070f3467d105e22c003d23f9184c5b526d481 --- /dev/null +++ b/web-llm-models/v0_2_80/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16824420129661706fc37ab2682cee95b1b124b5f637918f9962dd255f826326 +size 5432524 diff --git a/web-llm-models/v0_2_80/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..279ab6662db07fc31888162e84db272a30ef5b10 --- /dev/null +++ b/web-llm-models/v0_2_80/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b932162e61f885f1dd93f1a19a7126af973be480f8a3f6ba1834e488a924b864 +size 5210961 diff --git a/web-llm-models/v0_2_80/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..594f9154b016841e414233b374bb0a35cec3d767 --- /dev/null +++ b/web-llm-models/v0_2_80/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:830938512979859cd6164d8904b38e3d6e4ac625b0e05dcfbd179205e49297d6 +size 7894526 diff --git a/web-llm-models/v0_2_80/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..9b33e2cde49367faf382bf9b447cecf1fdf0e0fd --- /dev/null +++ b/web-llm-models/v0_2_80/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35d3461ad48a712a8e88c32d8dffa29e26db64fa30efd9d34fd06efdcf154a57 +size 5462970 diff --git a/web-llm-models/v0_2_80/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm 
b/web-llm-models/v0_2_80/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..433764ec52b931c23d55797aba69c312c4115d80 --- /dev/null +++ b/web-llm-models/v0_2_80/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a35c7934353bbe5a03c9e7a4f1b717a4e60aa13ac7659f7b7a368ab5e427d26d +size 5241749 diff --git a/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b0f7038e95e60220d31d0fddb79c710110ef2077 --- /dev/null +++ b/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cf1e920c3c5c23f63ca36490a533b4c5fad2cd88ac002b4c69f0201dab9194c +size 4418905 diff --git a/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..35a7f0a97a69d372f3017372b08389fa8a8574d8 --- /dev/null +++ b/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e085fcdbf451fd2e020a436f48f7a847e497603fdaed964eed2963998bbea81f +size 4325761 diff --git a/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..33af27b8dc72d26a536641abbdc1838cb39b3ee5 --- /dev/null +++ b/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36d579738abb981f35847056680932aa4e10781a9fec2dfe21d220077293cdad +size 4657795 diff 
--git a/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..d17ba5629f030f52c6676e5ed0a425fd5e0c806c --- /dev/null +++ b/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4be8362e40c748c484d7c342dec87f9efb4db13d0188ab8344bfa978a49df2cc +size 4540037 diff --git a/web-llm-models/v0_2_80/Llama-3.2-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3.2-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..32485f0da00a25daa89c5ab3f0eb0902989a32bc --- /dev/null +++ b/web-llm-models/v0_2_80/Llama-3.2-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad7755fc12341fc983105e03f71a2170fcda7d93630efdd50a5c9b9e96f329e5 +size 5302431 diff --git a/web-llm-models/v0_2_80/Llama-3.2-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3.2-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..e0bd104994635f8bdcf0cb59d5dff06854516104 --- /dev/null +++ b/web-llm-models/v0_2_80/Llama-3.2-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91fb3d3e7dcd91f758d3e0babea20f8aef688fd6dae8ebd7e3ccad340f88a9f8 +size 5101685 diff --git a/web-llm-models/v0_2_80/Llama-3_1-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3_1-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..abc3e047c394d40b9bfba40d04d16fb21489e07d --- /dev/null +++ b/web-llm-models/v0_2_80/Llama-3_1-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:6d495540e8e391a84c3d1694c584dc1cc8686d57d268169dd91d1110baa4e952 +size 7903309 diff --git a/web-llm-models/v0_2_80/Llama-3_1-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3_1-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..c718040f28087717711e0161284d6f99b52b0059 --- /dev/null +++ b/web-llm-models/v0_2_80/Llama-3_1-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8718b5a459c6fe6e47aa9ac193a2bb605828cad3e710bb66f0e0f34418d4e57f +size 5471751 diff --git a/web-llm-models/v0_2_80/Llama-3_1-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3_1-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..6d13c661f8a144b2eae6629660c757a6f96f9083 --- /dev/null +++ b/web-llm-models/v0_2_80/Llama-3_1-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed45f31f897dbe1d41ad117b35b73dbd7cbca1365d230ddaf3b8c2681a835604 +size 5248471 diff --git a/web-llm-models/v0_2_80/Mistral-7B-Instruct-v0.3-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Mistral-7B-Instruct-v0.3-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..603006943c578859d11b07163964692aa6ffac7e --- /dev/null +++ b/web-llm-models/v0_2_80/Mistral-7B-Instruct-v0.3-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8babd2d77415bf663d4d708947c7db25680285932350a7f280c3cea3753abc5b +size 4615812 diff --git a/web-llm-models/v0_2_80/Mistral-7B-Instruct-v0.3-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Mistral-7B-Instruct-v0.3-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..550b01a5b6d00d685895ec89902aa27ba6913ec3 --- 
/dev/null +++ b/web-llm-models/v0_2_80/Mistral-7B-Instruct-v0.3-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:799d7fdf1888de1a90641c4a0896762d7a97a1f79623e2f84fd03c5d34867232 +size 4477233 diff --git a/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-old-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-old-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..7d1a43f5b97484dd91d78c85b34aeeae77a3bfb5 --- /dev/null +++ b/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-old-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:251539b950c50592842cbdc4685fa6e87a2d2f01020eb2398800107223a55457 +size 4621036 diff --git a/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..7d1a43f5b97484dd91d78c85b34aeeae77a3bfb5 --- /dev/null +++ b/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:251539b950c50592842cbdc4685fa6e87a2d2f01020eb2398800107223a55457 +size 4621036 diff --git a/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..dfc758b4428ddbe4886b9564f97e284ebf371336 --- /dev/null +++ b/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e88ba4ef7898f6ae3c5be4d8a029d665f380e1a5e2ea1447f7e0c4622d0e3f41 +size 4497612 diff --git a/web-llm-models/v0_2_80/Phi-3.5-mini-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm 
b/web-llm-models/v0_2_80/Phi-3.5-mini-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..a06d6bfe1bf1891e2b47a5c526612e81a58a3371 --- /dev/null +++ b/web-llm-models/v0_2_80/Phi-3.5-mini-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc2f7c0760b3ca2ad9055267aaa3ddc8989d57802362958223a49ac3fbc96aff +size 4626576 diff --git a/web-llm-models/v0_2_80/Phi-3.5-mini-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Phi-3.5-mini-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..56951f252935772fa9078591faa6063f0ecf6bb6 --- /dev/null +++ b/web-llm-models/v0_2_80/Phi-3.5-mini-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f826e45c9955a692f0e9b96701337fac527f3a8d2e18caf4f9c5d068d057d05 +size 4502793 diff --git a/web-llm-models/v0_2_80/Phi-3.5-vision-instruct-q4f16_1-ctx4k_cs2k-webgpu.wasm b/web-llm-models/v0_2_80/Phi-3.5-vision-instruct-q4f16_1-ctx4k_cs2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..3f78508ef9b728c414105ea062e8e93417bce6fb --- /dev/null +++ b/web-llm-models/v0_2_80/Phi-3.5-vision-instruct-q4f16_1-ctx4k_cs2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a1827e7c9679f68eea59b6d2baef1fe9d42b9748678ee0bc393795c915d1816 +size 6146107 diff --git a/web-llm-models/v0_2_80/Phi-3.5-vision-instruct-q4f32_1-ctx4k_cs2k-webgpu.wasm b/web-llm-models/v0_2_80/Phi-3.5-vision-instruct-q4f32_1-ctx4k_cs2k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..48e547dcf8694856ec5295bdced35522d9854d1a --- /dev/null +++ b/web-llm-models/v0_2_80/Phi-3.5-vision-instruct-q4f32_1-ctx4k_cs2k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:d4d6c9d9fa9286ae0ebb692804ac6898294e251b537644994f9c6f78cf54ae4c +size 6009000 diff --git a/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..bcd5230901873ab825027786bb144162243564ed --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7043670804ddfe408ab96d83e5f5637c413aaf9e386cbd7d2ca6ded4e648179 +size 4088133 diff --git a/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..fbaafed73ac3a692a3e7ec3b5f643dfee21f21e1 --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21bc66498f545b298a968a039979f7d1f6bde85f1653099fc0c0df3d00097300 +size 4058892 diff --git a/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..74ccfb2c85e6990f70e34874d0dd8cc30a85f580 --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:627e26cb89b457ef02480912f147f8b7126f2e50cbcba6ac553aa1b142ae0822 +size 4133881 diff --git a/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-testtokenizer-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-testtokenizer-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..80fee093c9957ef811f29e2506e62e1ef5690cf8 --- /dev/null +++ 
b/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-testtokenizer-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bee55eef3064f287287d87473301f51890991c998c91437387ed844bcbcf3b84 +size 4162181 diff --git a/web-llm-models/v0_2_80/Qwen2-1.5B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2-1.5B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..1e916273ea949499a1809712f1920b2a6287a333 --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen2-1.5B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abb9b4cf41ae2a87f0762df6a3e50a3b9f361fd0138316fa38f1986f7abedd26 +size 4541432 diff --git a/web-llm-models/v0_2_80/Qwen2-1.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2-1.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..c911e0fc59c6f7e9049bbb73e310b0e6a438b4f3 --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen2-1.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f75a009bc20fe4f1ca47cc5b0983e4d8c946d1c51515e268e92bea421b8ca1c +size 4421335 diff --git a/web-llm-models/v0_2_80/Qwen2-7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2-7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..00fd8e391eb96325d941e275c2d311065a23ad2c --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen2-7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e30bd67251a3b4967ce5d7d738b121eddb543ed650cf5adf5bf1d80f9e205b3 +size 4656226 diff --git a/web-llm-models/v0_2_80/Qwen2-7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2-7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 
0000000000000000000000000000000000000000..0b4c9b2f871f25e61d32d1dc609ec67a1092116e --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen2-7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9d33e7b9963d1adbcb148327b0015c7d7099cdf50b3423b7fec469f494e4373 +size 4528253 diff --git a/web-llm-models/v0_2_80/Qwen2.5-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2.5-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..49946c4f90e8b6fef5ed3a9966a85ec729ba188c --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen2.5-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:806c019a9e17987a18bd73380f38ad4ea2dfb686a2e088a8b7939ab139f02f07 +size 4761165 diff --git a/web-llm-models/v0_2_80/Qwen2.5-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2.5-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..04f4cae95d31b6df6e7cef93ad640face92666a9 --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen2.5-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bab183552e418d3a719372fa1813e4875133e5ea6e2c8053d5f63b8383031db +size 4619438 diff --git a/web-llm-models/v0_2_80/Qwen3-0.6B-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-0.6B-q0f16-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..f037e293181c6620bdbfea73c6939c47233bb50b --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen3-0.6B-q0f16-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3725b9724afacda54874e2bfe1723737cd006ef1283c20099437530625e5e4df +size 4728697 diff --git a/web-llm-models/v0_2_80/Qwen3-0.6B-q0f32-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-0.6B-q0f32-ctx4k_cs1k-webgpu.wasm new file 
mode 100644 index 0000000000000000000000000000000000000000..27399f5188283ba86a058852049234c20ffe4356 --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen3-0.6B-q0f32-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b8e45c3af21d6d43e7816e2a0108dee260c426940b0f790dc3bc3d40c2b32e3 +size 4636240 diff --git a/web-llm-models/v0_2_80/Qwen3-0.6B-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-0.6B-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..02083b22c2384cc78b31b669b74c51af941322b2 --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen3-0.6B-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56d785a162b3cbb2fded342e856e321fa5328ce9da5fa151fcba71e56024ad93 +size 4923843 diff --git a/web-llm-models/v0_2_80/Qwen3-0.6B-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-0.6B-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..482273074e11bf97ed4103c6597eb8e3f84ecebe --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen3-0.6B-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:292fa0e4e75fb9defe1c48254bce2795a990442529a086df19587d1db42b38b3 +size 4807405 diff --git a/web-llm-models/v0_2_80/Qwen3-1.7B-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-1.7B-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..4f789db8ef279e49b31257cfa29afd088b7a40db --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen3-1.7B-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3d8290e1b94c4b474e7126289cb7991a69ed2862952b32c0352403238bf9b01 +size 4954364 diff --git a/web-llm-models/v0_2_80/Qwen3-1.7B-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-1.7B-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 
0000000000000000000000000000000000000000..3f3424521ff7294a78e67edffd8cd41aee9e77b9 --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen3-1.7B-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ceaace42da8820ca10a7be244cae90df761592dac766a5f3e38632254377ab0 +size 4832975 diff --git a/web-llm-models/v0_2_80/Qwen3-4B-Instruct-2507-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-4B-Instruct-2507-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..00ad4bfd68f1baff40f8642e816f046111745874 --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen3-4B-Instruct-2507-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e9e9bef2e4e75abe8db6fb06189f908ea57935735473da6b7dcce93cadcb0f7 +size 5239948 diff --git a/web-llm-models/v0_2_80/Qwen3-4B-Instruct-2507-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-4B-Instruct-2507-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..49af8c2c2871c7a6f5e9f0fb420c01d8c4ea03d0 --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen3-4B-Instruct-2507-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04549118d7e45e724615a29fa893601b4f8a46399ec6c8dbb5504c2fb5e5ce82 +size 5096403 diff --git a/web-llm-models/v0_2_80/Qwen3-4B-Thinking-2507-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-4B-Thinking-2507-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..00ad4bfd68f1baff40f8642e816f046111745874 --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen3-4B-Thinking-2507-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e9e9bef2e4e75abe8db6fb06189f908ea57935735473da6b7dcce93cadcb0f7 +size 5239948 diff --git a/web-llm-models/v0_2_80/Qwen3-4B-Thinking-2507-q4f32_1-ctx4k_cs1k-webgpu.wasm 
b/web-llm-models/v0_2_80/Qwen3-4B-Thinking-2507-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..49af8c2c2871c7a6f5e9f0fb420c01d8c4ea03d0 --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen3-4B-Thinking-2507-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04549118d7e45e724615a29fa893601b4f8a46399ec6c8dbb5504c2fb5e5ce82 +size 5096403 diff --git a/web-llm-models/v0_2_80/Qwen3-4B-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-4B-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..f9555c9974f65086d0b4584983935f43222db217 --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen3-4B-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:341aafc07e222f37e8edc7d466d5780b195723e7a80eb58fcd46b7444a4a879d +size 5239948 diff --git a/web-llm-models/v0_2_80/Qwen3-4B-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-4B-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..23c98f6ad2f909698173af3dbd6b4624ae8ce6a2 --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen3-4B-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:874a8d0ca74d5d90eead4e5e6d6142b17316a211816d068d6c094f8b86f57f11 +size 5096403 diff --git a/web-llm-models/v0_2_80/Qwen3-8B-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-8B-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..a2b02904dc3fa59b61767138604b1e5d1683d875 --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen3-8B-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb5c0b053def967400622d893b438bdf62e74d16e6bd97aabb3c71ca5fefa850 +size 5249209 diff --git a/web-llm-models/v0_2_80/Qwen3-8B-q4f32_1-ctx4k_cs1k-webgpu.wasm 
b/web-llm-models/v0_2_80/Qwen3-8B-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..118a95a37f2d31e99c63508f16b11aadc2e55391 --- /dev/null +++ b/web-llm-models/v0_2_80/Qwen3-8B-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4475d9accb042f807b4f5004584ebbca9abf5659c8ce7b2b4edd01e031347381 +size 5100016 diff --git a/web-llm-models/v0_2_80/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..a0393d4ffa2a727ef06bf7c87a8de8db986f1156 --- /dev/null +++ b/web-llm-models/v0_2_80/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ac8742d3ebfe8d73dee65b7f9ad028b9b3684429f372aee08498474a05f9e24 +size 4913981 diff --git a/web-llm-models/v0_2_80/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..0b833b5299170f4428a92f0a617b44fc186678af --- /dev/null +++ b/web-llm-models/v0_2_80/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cff4ac94d9a1b51bda503f762b5fa1c1307ee851a1e5fdb8aadd7e225bc8e8f +size 4867021 diff --git a/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..abe7da82a2d01a3853aa1823774323e92722cc62 --- /dev/null +++ b/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29b4280a39df222869a5a19ed5ea3400742243048b643c3e621df4aab04b07d3 
+size 4737987 diff --git a/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..e5b8fe5dd1fccf9a0f1a62ff80ed8f57ec8bb85f --- /dev/null +++ b/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6fc09134d32e16a47fd117eb6411c99488806a0bbf881874d58e5ff00dd5290 +size 5026864 diff --git a/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..07b991ce2c32ed3f915364f6633d02db5891f64d --- /dev/null +++ b/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bd275e0055d9f21be53dfb443dbcf7444b9d8d9d39eea1f5b96377c007bcc68 +size 4869922 diff --git a/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..c2b599d9b95abd037baabf5596b14e0448aeb7cb --- /dev/null +++ b/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b3c6f201de25b20301562dd571fc8f2b859596df09a1b29535d0fe04702c322 +size 4703557 diff --git a/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..e8b5fd70fddb14624aabef58b38893421ee26ab8 --- /dev/null +++ b/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:e792ea4dd15eb352775224490f31229ab805cd3f768cba339473d339ac916ef1 +size 4674751 diff --git a/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..0766454192b18b12be734a64e1b3d4fd903f9d82 --- /dev/null +++ b/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02e3b4da928bcbc051335cbbac501e40eaae1cb4f2a4ab196cb1fffcceee3aa7 +size 5023498 diff --git a/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..506d7236417d93d71532ba35d34294430c6abe4e --- /dev/null +++ b/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2892b3f4fd2fa672b3568a4995124c4331989e2f8d985af26071e3b34ee82801 +size 4994608 diff --git a/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b5cf1aa3cea574275758ffd116ed8cb1fb2cf4a2 --- /dev/null +++ b/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a0f50bebcd5b9b55d569cd9f605bc197e9a5e899ef80529dda705cc446541fe +size 4825417 diff --git a/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..06623902922ab5070db82858f9bb70a936082904 --- /dev/null +++ 
b/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75c5602d923eea8b6d4e19d65d0f5f932129a8b1ed2f1367d75f64f64ba580ea +size 4796086 diff --git a/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..c577792264f2f1e7a28533ca0c1630ae510d9f00 --- /dev/null +++ b/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d07d1bb06ce2455da8a2aab9bce9a746cb56ed4177611a7a33141cae4b422a79 +size 5056973 diff --git a/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..00f204362feaa3a3257879116ec3f4f827a4b36b --- /dev/null +++ b/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09434111064e168afc361d34925cbc776b108fa92d09b602f78517f417335804 +size 5027616 diff --git a/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..beb8f7085fe8454de22c68617d5392cb0a16be74 --- /dev/null +++ b/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c075fd75e08b580a80d44ca63f45f0c9fc67313c25afdeff9e002901a141d0b +size 4665014 diff --git a/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 
0000000000000000000000000000000000000000..88dca71ad6f7b41c232edc1af3846e5daf517278 --- /dev/null +++ b/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78b9f19791b15bd7a9bf5da45338b91ee8c9025e2e0092a5d96f4f1ef9234724 +size 4533418 diff --git a/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..d14c055b6476d44a15d895de28082b511c89f6b2 --- /dev/null +++ b/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef51c2e76fc1bb5e055edf961b84af026f6626d13533eb13a914e6a1e640c970 +size 4938116 diff --git a/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..1104b4fcc6f2305612ae040678adb6c4e8fe0504 --- /dev/null +++ b/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a008cfbc8aea6047638edd32330c29e17eaf436c316e64c66050d85831f5074a +size 4791630 diff --git a/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v1.0-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v1.0-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..d14c055b6476d44a15d895de28082b511c89f6b2 --- /dev/null +++ b/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v1.0-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef51c2e76fc1bb5e055edf961b84af026f6626d13533eb13a914e6a1e640c970 +size 4938116 diff --git 
import os
import subprocess
import sys
from pathlib import Path

LOG_PATH = Path("./") / "compile_wasm_log.txt"
# NOTE(Harry): Set this to your binary-mlc-llm-libs repo.
BINARY_DIR = "/path/to/binary-mlc-llm-libs/web-llm-models/v0_2_80"

# -1. Clean log file
cmd = [
    "rm",
    "-rf",
    "./compile_wasm_log.txt",
]
print(" ".join(cmd), flush=True)
subprocess.run(cmd, check=True, stderr=subprocess.STDOUT, env=os.environ)


# Labels embedded in the output wasm file name for each supported size.
_SIZE_TAGS = {4096: "4k", 2048: "2k", 1024: "1k", 512: "512"}


def _size_tag(size, what):
    """Return the file-name label for `size`, or raise RuntimeError naming the bad value.

    `what` is the short prefix used in the error message ("ctx" or "cs").
    """
    try:
        return _SIZE_TAGS[size]
    except (KeyError, TypeError):
        # Report the offending value itself; the label is not known at this point.
        raise RuntimeError(f"Unrecognized {what}: {size}") from None


def _run_logged(cmd, log_file):
    """Echo `cmd` to stdout, then run it with stdout/stderr redirected to `log_file`."""
    print(" ".join(cmd), flush=True)
    subprocess.run(cmd, check=True, stdout=log_file, stderr=subprocess.STDOUT, env=os.environ)


def compile(
    model,
    quantization,
    context_window_size,
    prefill_chunk_size,
    model_id,
    use_sliding_window=False,
    max_batch_size=None,
):
    """Generate an MLC chat config for `model` and compile it to a WebGPU wasm.

    The wasm is written to BINARY_DIR as
    ``{model_id}-{quantization}-{ctx|sw}{size}_cs{size}[_batch{N}]-webgpu.wasm``.
    Every command is echoed to stdout and its output appended to LOG_PATH.

    Args:
        model: Model argument passed to ``mlc_llm gen_config``.
        quantization: Quantization code, e.g. ``"q4f16_1"``.
        context_window_size: One of 4096, 2048, 1024, 512. Passed as the sliding
            window size instead when `use_sliding_window` is true.
        prefill_chunk_size: One of 4096, 2048, 1024, 512.
        model_id: Prefix of the output file name.
        use_sliding_window: Use ``--sliding-window-size`` and an ``sw`` name tag
            instead of ``--context-window-size`` / ``ctx``.
        max_batch_size: When truthy, forwarded as ``--max-batch-size`` and added
            to the file name as ``_batch{N}``.

    Raises:
        RuntimeError: If either size is not one of the supported values. This is
            checked before any command is run.
        subprocess.CalledProcessError: If any of the invoked commands fails.
    """
    # Resolve the output name first so an unsupported size fails before any
    # temp-folder cleanup or config generation is attempted.
    ctx = _size_tag(context_window_size, "ctx")
    cs = _size_tag(prefill_chunk_size, "cs")

    # e.g. Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm
    window_tag = "sw" if use_sliding_window else "ctx"
    output_file_name = f"{model_id}-{quantization}-{window_tag}{ctx}_cs{cs}"
    if max_batch_size:
        output_file_name += f"_batch{max_batch_size}"
    output_file_name += "-webgpu.wasm"
    output_path = os.path.join(BINARY_DIR, output_file_name)

    with LOG_PATH.open("a", encoding="utf-8") as log_file:
        # 0. Clean temp folder
        _run_logged(["rm", "-rf", "dist/temp/"], log_file)

        # 1. Gen config
        cmd = [
            sys.executable,
            "-m",
            "mlc_llm",
            "gen_config",
            model,
            "--output",
            "dist/temp",
            "--conv-template",
            "LM",
            "--quantization",
            quantization,
            "--prefill-chunk-size",
            str(prefill_chunk_size),
        ]
        if use_sliding_window:
            cmd += ["--sliding-window-size", str(context_window_size)]
        else:
            cmd += ["--context-window-size", str(context_window_size)]
        if max_batch_size:
            cmd += ["--max-batch-size", str(max_batch_size)]
        _run_logged(cmd, log_file)

        # 2. Compile the generated config for the webgpu device
        cmd = [
            sys.executable,
            "-m",
            "mlc_llm",
            "compile",
            "dist/temp/mlc-chat-config.json",
            "--device",
            "webgpu",
            "--output",
            output_path,
        ]
        _run_logged(cmd, log_file)

        # 3. Clean temp mlc-chat-config.json
        _run_logged(["rm", "-rf", "dist/temp/mlc-chat-config.json"], log_file)


# NOTE(Charlie): As of 03/31/2025, the context window size does not do anything because
# it has become a runtime thing in both MLC-LLM and WebLLM.

# NOTE(Harry): To compile a wasm, uncomment the corresponding line below.

# compile("phi-3", "q4f16_1", 4096, 1024, "Phi-3-mini-4k-instruct")
# compile("phi-3", "q4f16_1", 4096, 1024, "Phi-3-mini-4k-instruct-old")
# compile("phi-3", "q4f32_1", 4096, 1024, "Phi-3-mini-4k-instruct")

# compile("llama3_8b", "q4f16_1", 4096, 1024, "Llama-3-8B-Instruct")
# compile("llama3_8b", "q4f32_1", 4096, 1024, "Llama-3-8B-Instruct")

# compile("llama2_7b", "q4f16_1", 4096, 1024, "Llama-2-7b-chat-hf")
# compile("llama2_7b", "q4f32_1", 4096, 1024, "Llama-2-7b-chat-hf")

# compile("llama2_13b", "q4f16_1", 4096, 1024, "Llama-2-13b-chat-hf")

# compile("mistral_7b_v03", "q4f16_1", 4096, 1024, "Mistral-7B-Instruct-v0.3")
# compile("mistral_7b_v03", "q4f32_1", 4096, 1024, "Mistral-7B-Instruct-v0.3")

# compile("redpajama_3b_v1", "q4f16_1", 2048, 1024, "RedPajama-INCITE-Chat-3B-v1")
# compile("redpajama_3b_v1", "q4f32_1", 2048, 1024, "RedPajama-INCITE-Chat-3B-v1")

# compile("tinyllama_1b_chat_v0.4", "q0f16", 2048, 1024, "TinyLlama-1.1B-Chat-v0.4")
# compile("tinyllama_1b_chat_v0.4", "q0f32", 2048, 1024, "TinyLlama-1.1B-Chat-v0.4")
# compile("tinyllama_1b_chat_v0.4", "q4f16_1", 2048, 1024, "TinyLlama-1.1B-Chat-v0.4")
# compile("tinyllama_1b_chat_v0.4", "q4f32_1", 2048, 1024, "TinyLlama-1.1B-Chat-v0.4")

# compile("tinyllama_1b_chat_v1.0", "q4f16_1", 2048, 1024, "TinyLlama-1.1B-Chat-v1.0")
# compile("tinyllama_1b_chat_v1.0", "q4f32_1", 2048, 1024, "TinyLlama-1.1B-Chat-v1.0")

# compile("gemma_2b", "q4f16_1", 4096, 1024, "gemma-2b-it")
# compile("gemma_2b", "q4f32_1", 4096, 1024,
"gemma-2b-it") + +# compile("gpt2_medium", "q0f16", 1024, 1024, "gpt2-medium") +# compile("gpt2", "q0f16", 1024, 1024, "gpt2") + +# compile("phi-1_5", "q4f16_1", 2048, 1024, "phi-1_5") +# compile("phi-1_5", "q4f32_1", 2048, 1024, "phi-1_5") + +# compile("phi-2", "q4f16_1", 2048, 1024, "phi-2") +# compile("phi-2", "q4f32_1", 2048, 1024, "phi-2") + +# compile("stablelm-2-zephyr-1_6b", "q4f16_1", 4096, 1024, "stablelm-2-zephyr-1_6b") +# compile("stablelm-2-zephyr-1_6b", "q4f32_1", 4096, 1024, "stablelm-2-zephyr-1_6b") + +# compile("qwen2_0_5b", "q4f16_1", 4096, 1024, "Qwen2-0.5B-Instruct") +# compile("qwen2_0_5b", "q4f32_1", 4096, 1024, "Qwen2-0.5B-Instruct") +# compile("qwen2_0_5b", "q0f16", 4096, 1024, "Qwen2-0.5B-Instruct") +# compile("qwen2_0_5b", "q0f32", 4096, 1024, "Qwen2-0.5B-Instruct") + +# compile("qwen2_1_5b", "q4f16_1", 4096, 1024, "Qwen2-1.5B-Instruct") +# compile("qwen2_1_5b", "q4f32_1", 4096, 1024, "Qwen2-1.5B-Instruct") + +# compile("qwen2.5_3b", "q4f16_1", 4096, 1024, "Qwen2.5-3B-Instruct") +# compile("qwen2.5_3b", "q4f32_1", 4096, 1024, "Qwen2.5-3B-Instruct") + +# compile("qwen2_7b", "q4f16_1", 4096, 1024, "Qwen2-7B-Instruct") +# compile("qwen2_7b", "q4f32_1", 4096, 1024, "Qwen2-7B-Instruct") + +# compile("llama3_70b", "q3f16_1", 4096, 1024, "Llama-3-70B-Instruct") + +# compile("llama3_1_8b", "q4f16_1", 4096, 1024, "Llama-3_1-8B-Instruct") +# compile("llama3_1_8b", "q4f32_1", 4096, 1024, "Llama-3_1-8B-Instruct") + +# compile("llama3_1_70b", "q3f16_1", 4096, 1024, "Llama-3_1-70B-Instruct") + +# compile("gemma2_2b", "q4f16_1", 4096, 1024, "gemma-2-2b-it") +# compile("gemma2_2b", "q4f32_1", 4096, 1024, "gemma-2-2b-it") + +# compile("gemma2_9b", "q4f16_1", 4096, 1024, "gemma-2-9b-it") +# compile("gemma2_9b", "q4f32_1", 4096, 1024, "gemma-2-9b-it") + +# # max_position_embeddings is set to be 512 here for embedding model; no rope is used +# compile( +# "snowflake-arctic-embed-m", "q0f32", 512, 512, "snowflake-arctic-embed-m", max_batch_size=32 +# ) +# 
compile("snowflake-arctic-embed-m", "q0f32", 512, 512, "snowflake-arctic-embed-m", max_batch_size=4) + +# compile( +# "snowflake-arctic-embed-s", "q0f32", 512, 512, "snowflake-arctic-embed-s", max_batch_size=32 +# ) +# compile("snowflake-arctic-embed-s", "q0f32", 512, 512, "snowflake-arctic-embed-s", max_batch_size=4) + +# # Cannot be shared with phi-3 because phi3.5 has rope scaling +# compile("phi-3_5", "q4f16_1", 4096, 1024, "Phi-3.5-mini-instruct") +# compile("phi-3_5", "q4f32_1", 4096, 1024, "Phi-3.5-mini-instruct") + +# compile("phi-3_5-vision", "q4f16_1", 4096, 2048, "Phi-3.5-vision-instruct") +# compile("phi-3_5-vision", "q4f32_1", 4096, 2048, "Phi-3.5-vision-instruct") + +# # Llama3.2 1B/3B +# compile("llama3_2_1b", "q0f16", 4096, 1024, "Llama-3.2-1B-Instruct") +# compile("llama3_2_1b", "q0f32", 4096, 1024, "Llama-3.2-1B-Instruct") +# compile("llama3_2_1b", "q4f16_1", 4096, 1024, "Llama-3.2-1B-Instruct") +# compile("llama3_2_1b", "q4f32_1", 4096, 1024, "Llama-3.2-1B-Instruct") + +# compile("llama3_2_3b", "q4f16_1", 4096, 1024, "Llama-3.2-3B-Instruct") +# compile("llama3_2_3b", "q4f32_1", 4096, 1024, "Llama-3.2-3B-Instruct") + +# compile("gemma2_2b-jpn", "q4f16_1", 4096, 1024, "gemma-2-2b-jpn-it") +# compile("gemma2_2b-jpn", "q4f32_1", 4096, 1024, "gemma-2-2b-jpn-it") + +# compile("smollm2_1_7b", "q0f16", 4096, 1024, "SmolLM2-1.7B-Instruct") +# compile("smollm2_1_7b", "q4f16_1", 4096, 1024, "SmolLM2-1.7B-Instruct") +# compile("smollm2_1_7b", "q4f32_1", 4096, 1024, "SmolLM2-1.7B-Instruct") + +# compile("smollm2_360m", "q0f16", 4096, 1024, "SmolLM2-360M-Instruct") +# compile("smollm2_360m", "q0f32", 4096, 1024, "SmolLM2-360M-Instruct") +# compile("smollm2_360m", "q4f16_1", 4096, 1024, "SmolLM2-360M-Instruct") +# compile("smollm2_360m", "q4f32_1", 4096, 1024, "SmolLM2-360M-Instruct") + +# compile("smollm2_135m", "q0f16", 4096, 1024, "SmolLM2-135M-Instruct") +# compile("smollm2_135m", "q0f32", 4096, 1024, "SmolLM2-135M-Instruct") +# compile("smollm2_135m", 
"q4f16_1", 4096, 1024, "SmolLM2-135M-Instruct") +# compile("smollm2_135m", "q4f32_1", 4096, 1024, "SmolLM2-135M-Instruct") + +# compile("gemma3_1b_it", "q4f16_1", 4096, 1024, "gemma3-1b-it") + + +# compile("qwen3_0.6b", "q4f16_1", 4096, 1024, "Qwen3-0.6B") +# compile("qwen3_0.6b", "q4f32_1", 4096, 1024, "Qwen3-0.6B") +# compile("qwen3_0.6b", "q0f16", 4096, 1024, "Qwen3-0.6B") +# compile("qwen3_0.6b", "q0f32", 4096, 1024, "Qwen3-0.6B") + +# compile("qwen3_1.7b", "q4f16_1", 4096, 1024, "Qwen3-1.7B") +# compile("qwen3_1.7b", "q4f32_1", 4096, 1024, "Qwen3-1.7B") + +# compile("qwen3_4b", "q4f16_1", 4096, 1024, "Qwen3-4B") +# compile("qwen3_4b", "q4f32_1", 4096, 1024, "Qwen3-4B") + +# compile("qwen3_8b", "q4f16_1", 4096, 1024, "Qwen3-8B") +# compile("qwen3_8b", "q4f32_1", 4096, 1024, "Qwen3-8B") + +# compile("qwen3_4b_instruct_2507", "q4f16_1", 4096, 1024, "Qwen3-4B-Instruct-2507") +# compile("qwen3_4b_instruct_2507", "q4f32_1", 4096, 1024, "Qwen3-4B-Instruct-2507") + +# compile("qwen3_4b_thinking_2507", "q4f16_1", 4096, 1024, "Qwen3-4B-Thinking-2507") +compile("qwen3_4b_thinking_2507", "q4f32_1", 4096, 1024, "Qwen3-4B-Thinking-2507") + diff --git a/web-llm-models/v0_2_80/gemma-2-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma-2-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..89b9caf43d1d0aafc3204d7998fbbd5de879f820 --- /dev/null +++ b/web-llm-models/v0_2_80/gemma-2-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1faaa2251812567475a76fe86fb1bbf29a7c3db4ae73b18773060bf2d7c6e8d7 +size 4530799 diff --git a/web-llm-models/v0_2_80/gemma-2-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma-2-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..da95614b1aec2a5b686b5b43ce70c5c83c1a8657 --- /dev/null +++ b/web-llm-models/v0_2_80/gemma-2-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm 
@@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e8cfd32246359bb0c349017b6cdfa5ba863288863dd24318ee74fafa2e37430 +size 4503112 diff --git a/web-llm-models/v0_2_80/gemma-2-2b-jpn-it-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma-2-2b-jpn-it-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..89b9caf43d1d0aafc3204d7998fbbd5de879f820 --- /dev/null +++ b/web-llm-models/v0_2_80/gemma-2-2b-jpn-it-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1faaa2251812567475a76fe86fb1bbf29a7c3db4ae73b18773060bf2d7c6e8d7 +size 4530799 diff --git a/web-llm-models/v0_2_80/gemma-2-2b-jpn-it-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma-2-2b-jpn-it-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..da95614b1aec2a5b686b5b43ce70c5c83c1a8657 --- /dev/null +++ b/web-llm-models/v0_2_80/gemma-2-2b-jpn-it-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e8cfd32246359bb0c349017b6cdfa5ba863288863dd24318ee74fafa2e37430 +size 4503112 diff --git a/web-llm-models/v0_2_80/gemma-2-9b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma-2-9b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..e57ef5d5cb810bc91700f1242030024e7ba84fc8 --- /dev/null +++ b/web-llm-models/v0_2_80/gemma-2-9b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecf510613e41d66b91d2001ba55be48a36d7c79f806b670cf3fb4bf48f1af50f +size 5087840 diff --git a/web-llm-models/v0_2_80/gemma-2-9b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma-2-9b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..2842d8fc36536ab4c1d7ce88a5f5dd61b704ca0d --- /dev/null +++ 
b/web-llm-models/v0_2_80/gemma-2-9b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c4b04789f1e73394140005637846aac8f4d8db3010cd29d13a1aa560c971adc +size 5041859 diff --git a/web-llm-models/v0_2_80/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..a56e9a1ec8a8e3638f1e7e0e9641d629d6e1a0eb --- /dev/null +++ b/web-llm-models/v0_2_80/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7de56bb71bf51bf6924e88fea7e616ce1d59c52f9c40fcdc0dcd19f5ee5a501e +size 4235746 diff --git a/web-llm-models/v0_2_80/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..e2b77423084bd088af9cc75ef906934b6603639a --- /dev/null +++ b/web-llm-models/v0_2_80/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4560a713fb1636b5ad1a380b6e1543d3dca6eadecd461d0c80287d2fddc7953c +size 4168998 diff --git a/web-llm-models/v0_2_80/gemma3-1b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma3-1b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..080b606b9782ee46dd7f620fb4f3a8821a0df39b --- /dev/null +++ b/web-llm-models/v0_2_80/gemma3-1b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:630fdbd726367dc647123fbc4d7dd473e7daed1c382eaa7b42ff769dbca0711a +size 5053215 diff --git a/web-llm-models/v0_2_80/gpt2-medium-q0f16-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gpt2-medium-q0f16-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b128e5c058f72741812079f7170cd62804084dbd --- /dev/null +++ 
b/web-llm-models/v0_2_80/gpt2-medium-q0f16-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7f3fefc38d266d7f27a241f8386194dcbd4103b90eb990992af4d7efa8296a8 +size 4448319 diff --git a/web-llm-models/v0_2_80/gpt2-q0f16-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gpt2-q0f16-ctx1k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..ee9df8cbec755f76d261ad8068dfa65e04d3c8ef --- /dev/null +++ b/web-llm-models/v0_2_80/gpt2-q0f16-ctx1k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c9bfa66e6e9c9ee05a1da41169ff35f38faecc8eae1d29e3a5a4b2bab30fadd +size 4079567 diff --git a/web-llm-models/v0_2_80/phi-1_5-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/phi-1_5-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..948ffbde16635619fb67bfea9f99b730cfd789c1 --- /dev/null +++ b/web-llm-models/v0_2_80/phi-1_5-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d1b75ac4dc594574830f45ca223e6d60123f57476a83f5645ca07aaaaa9d8b1 +size 4535905 diff --git a/web-llm-models/v0_2_80/phi-1_5-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/phi-1_5-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..3eeb5a5712babd0be70e3fda26d5c7c5951aaef2 --- /dev/null +++ b/web-llm-models/v0_2_80/phi-1_5-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4e3b77c6453c538307d8d9290e4758d4c9844a61289c2df197fc74370601cf4 +size 4508100 diff --git a/web-llm-models/v0_2_80/phi-2-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/phi-2-q4f16_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..cbbb2846cf8a00b2e2853c45e7e692ccb19622a9 --- /dev/null +++ b/web-llm-models/v0_2_80/phi-2-q4f16_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:36cbeaa3ea894f475ce0a475e7cff16c2eeb964e9fcc96414ea82037c48eb54b +size 4711307 diff --git a/web-llm-models/v0_2_80/phi-2-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/phi-2-q4f32_1-ctx2k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..4090e8274f3074ae568594dee58e47cfe5d1b6ea --- /dev/null +++ b/web-llm-models/v0_2_80/phi-2-q4f32_1-ctx2k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bf59b4b4ae4d9ccbdf965f16fcf60dc88d238051def52ce50a0d3c379659c7d +size 4679325 diff --git a/web-llm-models/v0_2_80/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch32-webgpu.wasm b/web-llm-models/v0_2_80/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch32-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..4a131373f1440e6b556cc68ec887c7a35d6bd41d --- /dev/null +++ b/web-llm-models/v0_2_80/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch32-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a10a121186127774bcf6b6e2dcbcf9dc503c485dbbc3c3e7fb4153e457f81440 +size 2720636 diff --git a/web-llm-models/v0_2_80/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch4-webgpu.wasm b/web-llm-models/v0_2_80/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch4-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..b686fa47cb8c5f726e399fcb0c24b8de58c8ab15 --- /dev/null +++ b/web-llm-models/v0_2_80/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch4-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa8163e4fa1e318f357a276b8dd7b71dde2705165e2aeb89a6b5700dd22ca0c3 +size 2720639 diff --git a/web-llm-models/v0_2_80/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch32-webgpu.wasm b/web-llm-models/v0_2_80/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch32-webgpu.wasm new file mode 100644 index 
0000000000000000000000000000000000000000..79cb64ee9291b4159264628484bed9b0f9fde821 --- /dev/null +++ b/web-llm-models/v0_2_80/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch32-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a89478988d0ed16fdfade9517d7d8c69ed5aac671b3891ac9e329c64fb5a8d6b +size 2703661 diff --git a/web-llm-models/v0_2_80/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch4-webgpu.wasm b/web-llm-models/v0_2_80/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch4-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..d5493526e986cfcb5019a262ab7dd67e8105e707 --- /dev/null +++ b/web-llm-models/v0_2_80/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch4-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01afbc716fa17614533fefbb5ca3f20f5a9223be48ac10bf222e08ad2aece378 +size 2703663 diff --git a/web-llm-models/v0_2_80/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..0782654bdc225b6b38367496dffe95d7d7463b85 --- /dev/null +++ b/web-llm-models/v0_2_80/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc062e1865559bcd2a56a748dfae32a4ae9198ec2442eda52de50dd763676b32 +size 4510137 diff --git a/web-llm-models/v0_2_80/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..cdc5513109ba7de100e1a183c2d1a6c410712c6f --- /dev/null +++ b/web-llm-models/v0_2_80/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be81bd086647b1bce7174dc5ea775601bbd4b9cba75aac48cb4ea09a05096a04 +size 4480826