diff --git a/web-llm-models/v0_2_80/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index de9303f766f4e42e13902d5d130a35eb3ac132d2..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Llama-2-13b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5b4219693562cc5a3a198e017b83cb1e37a93c61529f925b1abd763566db28e5 -size 5867642 diff --git a/web-llm-models/v0_2_80/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index ed0070f3467d105e22c003d23f9184c5b526d481..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Llama-2-7b-chat-hf-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:16824420129661706fc37ab2682cee95b1b124b5f637918f9962dd255f826326 -size 5432524 diff --git a/web-llm-models/v0_2_80/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 279ab6662db07fc31888162e84db272a30ef5b10..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Llama-2-7b-chat-hf-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b932162e61f885f1dd93f1a19a7126af973be480f8a3f6ba1834e488a924b864 -size 5210961 diff --git a/web-llm-models/v0_2_80/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 594f9154b016841e414233b374bb0a35cec3d767..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Llama-3-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:830938512979859cd6164d8904b38e3d6e4ac625b0e05dcfbd179205e49297d6 -size 7894526 diff --git a/web-llm-models/v0_2_80/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 9b33e2cde49367faf382bf9b447cecf1fdf0e0fd..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:35d3461ad48a712a8e88c32d8dffa29e26db64fa30efd9d34fd06efdcf154a57 -size 5462970 diff --git a/web-llm-models/v0_2_80/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 433764ec52b931c23d55797aba69c312c4115d80..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Llama-3-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a35c7934353bbe5a03c9e7a4f1b717a4e60aa13ac7659f7b7a368ab5e427d26d -size 5241749 diff --git a/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index b0f7038e95e60220d31d0fddb79c710110ef2077..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5cf1e920c3c5c23f63ca36490a533b4c5fad2cd88ac002b4c69f0201dab9194c -size 4418905 diff --git a/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 35a7f0a97a69d372f3017372b08389fa8a8574d8..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e085fcdbf451fd2e020a436f48f7a847e497603fdaed964eed2963998bbea81f -size 4325761 diff --git a/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 33af27b8dc72d26a536641abbdc1838cb39b3ee5..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:36d579738abb981f35847056680932aa4e10781a9fec2dfe21d220077293cdad -size 4657795 diff --git a/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index d17ba5629f030f52c6676e5ed0a425fd5e0c806c..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Llama-3.2-1B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4be8362e40c748c484d7c342dec87f9efb4db13d0188ab8344bfa978a49df2cc -size 4540037 diff --git a/web-llm-models/v0_2_80/Llama-3.2-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3.2-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 32485f0da00a25daa89c5ab3f0eb0902989a32bc..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Llama-3.2-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ad7755fc12341fc983105e03f71a2170fcda7d93630efdd50a5c9b9e96f329e5 -size 5302431 diff --git a/web-llm-models/v0_2_80/Llama-3.2-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3.2-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index e0bd104994635f8bdcf0cb59d5dff06854516104..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Llama-3.2-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:91fb3d3e7dcd91f758d3e0babea20f8aef688fd6dae8ebd7e3ccad340f88a9f8 -size 5101685 diff --git a/web-llm-models/v0_2_80/Llama-3_1-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3_1-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index abc3e047c394d40b9bfba40d04d16fb21489e07d..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Llama-3_1-70B-Instruct-q3f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6d495540e8e391a84c3d1694c584dc1cc8686d57d268169dd91d1110baa4e952 -size 7903309 diff --git a/web-llm-models/v0_2_80/Llama-3_1-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3_1-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index c718040f28087717711e0161284d6f99b52b0059..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Llama-3_1-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8718b5a459c6fe6e47aa9ac193a2bb605828cad3e710bb66f0e0f34418d4e57f -size 5471751 diff --git a/web-llm-models/v0_2_80/Llama-3_1-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Llama-3_1-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 6d13c661f8a144b2eae6629660c757a6f96f9083..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Llama-3_1-8B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ed45f31f897dbe1d41ad117b35b73dbd7cbca1365d230ddaf3b8c2681a835604 -size 5248471 diff --git a/web-llm-models/v0_2_80/Mistral-7B-Instruct-v0.3-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Mistral-7B-Instruct-v0.3-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 603006943c578859d11b07163964692aa6ffac7e..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Mistral-7B-Instruct-v0.3-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8babd2d77415bf663d4d708947c7db25680285932350a7f280c3cea3753abc5b -size 4615812 diff --git a/web-llm-models/v0_2_80/Mistral-7B-Instruct-v0.3-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Mistral-7B-Instruct-v0.3-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 550b01a5b6d00d685895ec89902aa27ba6913ec3..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Mistral-7B-Instruct-v0.3-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:799d7fdf1888de1a90641c4a0896762d7a97a1f79623e2f84fd03c5d34867232 -size 4477233 diff --git a/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-old-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-old-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 7d1a43f5b97484dd91d78c85b34aeeae77a3bfb5..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-old-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:251539b950c50592842cbdc4685fa6e87a2d2f01020eb2398800107223a55457 -size 4621036 diff --git a/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 7d1a43f5b97484dd91d78c85b34aeeae77a3bfb5..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:251539b950c50592842cbdc4685fa6e87a2d2f01020eb2398800107223a55457 -size 4621036 diff --git a/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index dfc758b4428ddbe4886b9564f97e284ebf371336..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Phi-3-mini-4k-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e88ba4ef7898f6ae3c5be4d8a029d665f380e1a5e2ea1447f7e0c4622d0e3f41 -size 4497612 diff --git a/web-llm-models/v0_2_80/Phi-3.5-mini-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Phi-3.5-mini-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index a06d6bfe1bf1891e2b47a5c526612e81a58a3371..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Phi-3.5-mini-instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fc2f7c0760b3ca2ad9055267aaa3ddc8989d57802362958223a49ac3fbc96aff -size 4626576 diff --git a/web-llm-models/v0_2_80/Phi-3.5-mini-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Phi-3.5-mini-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 56951f252935772fa9078591faa6063f0ecf6bb6..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Phi-3.5-mini-instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3f826e45c9955a692f0e9b96701337fac527f3a8d2e18caf4f9c5d068d057d05 -size 4502793 diff --git a/web-llm-models/v0_2_80/Phi-3.5-vision-instruct-q4f16_1-ctx4k_cs2k-webgpu.wasm b/web-llm-models/v0_2_80/Phi-3.5-vision-instruct-q4f16_1-ctx4k_cs2k-webgpu.wasm deleted file mode 100644 index 3f78508ef9b728c414105ea062e8e93417bce6fb..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Phi-3.5-vision-instruct-q4f16_1-ctx4k_cs2k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1a1827e7c9679f68eea59b6d2baef1fe9d42b9748678ee0bc393795c915d1816 -size 6146107 diff --git a/web-llm-models/v0_2_80/Phi-3.5-vision-instruct-q4f32_1-ctx4k_cs2k-webgpu.wasm b/web-llm-models/v0_2_80/Phi-3.5-vision-instruct-q4f32_1-ctx4k_cs2k-webgpu.wasm deleted file mode 100644 index 48e547dcf8694856ec5295bdced35522d9854d1a..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Phi-3.5-vision-instruct-q4f32_1-ctx4k_cs2k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d4d6c9d9fa9286ae0ebb692804ac6898294e251b537644994f9c6f78cf54ae4c -size 6009000 diff --git a/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index bcd5230901873ab825027786bb144162243564ed..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a7043670804ddfe408ab96d83e5f5637c413aaf9e386cbd7d2ca6ded4e648179 -size 4088133 diff --git a/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index fbaafed73ac3a692a3e7ec3b5f643dfee21f21e1..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:21bc66498f545b298a968a039979f7d1f6bde85f1653099fc0c0df3d00097300 -size 4058892 diff --git a/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 74ccfb2c85e6990f70e34874d0dd8cc30a85f580..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:627e26cb89b457ef02480912f147f8b7126f2e50cbcba6ac553aa1b142ae0822 -size 4133881 diff --git a/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-testtokenizer-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-testtokenizer-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 80fee093c9957ef811f29e2506e62e1ef5690cf8..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen2-0.5B-Instruct-testtokenizer-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bee55eef3064f287287d87473301f51890991c998c91437387ed844bcbcf3b84 -size 4162181 diff --git a/web-llm-models/v0_2_80/Qwen2-1.5B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2-1.5B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 1e916273ea949499a1809712f1920b2a6287a333..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen2-1.5B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:abb9b4cf41ae2a87f0762df6a3e50a3b9f361fd0138316fa38f1986f7abedd26 -size 4541432 diff --git a/web-llm-models/v0_2_80/Qwen2-1.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2-1.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index c911e0fc59c6f7e9049bbb73e310b0e6a438b4f3..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen2-1.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4f75a009bc20fe4f1ca47cc5b0983e4d8c946d1c51515e268e92bea421b8ca1c -size 4421335 diff --git a/web-llm-models/v0_2_80/Qwen2-7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2-7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 00fd8e391eb96325d941e275c2d311065a23ad2c..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen2-7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2e30bd67251a3b4967ce5d7d738b121eddb543ed650cf5adf5bf1d80f9e205b3 -size 4656226 diff --git a/web-llm-models/v0_2_80/Qwen2-7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2-7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 0b4c9b2f871f25e61d32d1dc609ec67a1092116e..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen2-7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f9d33e7b9963d1adbcb148327b0015c7d7099cdf50b3423b7fec469f494e4373 -size 4528253 diff --git a/web-llm-models/v0_2_80/Qwen2.5-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2.5-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 49946c4f90e8b6fef5ed3a9966a85ec729ba188c..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen2.5-3B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:806c019a9e17987a18bd73380f38ad4ea2dfb686a2e088a8b7939ab139f02f07 -size 4761165 diff --git a/web-llm-models/v0_2_80/Qwen2.5-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen2.5-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 04f4cae95d31b6df6e7cef93ad640face92666a9..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen2.5-3B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9bab183552e418d3a719372fa1813e4875133e5ea6e2c8053d5f63b8383031db -size 4619438 diff --git a/web-llm-models/v0_2_80/Qwen3-0.6B-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-0.6B-q0f16-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index f037e293181c6620bdbfea73c6939c47233bb50b..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen3-0.6B-q0f16-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3725b9724afacda54874e2bfe1723737cd006ef1283c20099437530625e5e4df -size 4728697 diff --git a/web-llm-models/v0_2_80/Qwen3-0.6B-q0f32-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-0.6B-q0f32-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 27399f5188283ba86a058852049234c20ffe4356..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen3-0.6B-q0f32-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3b8e45c3af21d6d43e7816e2a0108dee260c426940b0f790dc3bc3d40c2b32e3 -size 4636240 diff --git a/web-llm-models/v0_2_80/Qwen3-0.6B-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-0.6B-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 02083b22c2384cc78b31b669b74c51af941322b2..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen3-0.6B-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:56d785a162b3cbb2fded342e856e321fa5328ce9da5fa151fcba71e56024ad93 -size 4923843 diff --git a/web-llm-models/v0_2_80/Qwen3-0.6B-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-0.6B-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 482273074e11bf97ed4103c6597eb8e3f84ecebe..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen3-0.6B-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:292fa0e4e75fb9defe1c48254bce2795a990442529a086df19587d1db42b38b3 -size 4807405 diff --git a/web-llm-models/v0_2_80/Qwen3-1.7B-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-1.7B-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 4f789db8ef279e49b31257cfa29afd088b7a40db..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen3-1.7B-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b3d8290e1b94c4b474e7126289cb7991a69ed2862952b32c0352403238bf9b01 -size 4954364 diff --git a/web-llm-models/v0_2_80/Qwen3-1.7B-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-1.7B-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 3f3424521ff7294a78e67edffd8cd41aee9e77b9..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen3-1.7B-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5ceaace42da8820ca10a7be244cae90df761592dac766a5f3e38632254377ab0 -size 4832975 diff --git a/web-llm-models/v0_2_80/Qwen3-4B-Instruct-2507-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-4B-Instruct-2507-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 00ad4bfd68f1baff40f8642e816f046111745874..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen3-4B-Instruct-2507-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2e9e9bef2e4e75abe8db6fb06189f908ea57935735473da6b7dcce93cadcb0f7 -size 5239948 diff --git a/web-llm-models/v0_2_80/Qwen3-4B-Instruct-2507-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-4B-Instruct-2507-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 49af8c2c2871c7a6f5e9f0fb420c01d8c4ea03d0..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen3-4B-Instruct-2507-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:04549118d7e45e724615a29fa893601b4f8a46399ec6c8dbb5504c2fb5e5ce82 -size 5096403 diff --git a/web-llm-models/v0_2_80/Qwen3-4B-Thinking-2507-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-4B-Thinking-2507-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 00ad4bfd68f1baff40f8642e816f046111745874..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen3-4B-Thinking-2507-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2e9e9bef2e4e75abe8db6fb06189f908ea57935735473da6b7dcce93cadcb0f7 -size 5239948 diff --git a/web-llm-models/v0_2_80/Qwen3-4B-Thinking-2507-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-4B-Thinking-2507-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 49af8c2c2871c7a6f5e9f0fb420c01d8c4ea03d0..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen3-4B-Thinking-2507-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:04549118d7e45e724615a29fa893601b4f8a46399ec6c8dbb5504c2fb5e5ce82 -size 5096403 diff --git a/web-llm-models/v0_2_80/Qwen3-4B-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-4B-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index f9555c9974f65086d0b4584983935f43222db217..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen3-4B-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:341aafc07e222f37e8edc7d466d5780b195723e7a80eb58fcd46b7444a4a879d -size 5239948 diff --git a/web-llm-models/v0_2_80/Qwen3-4B-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-4B-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 23c98f6ad2f909698173af3dbd6b4624ae8ce6a2..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen3-4B-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:874a8d0ca74d5d90eead4e5e6d6142b17316a211816d068d6c094f8b86f57f11 -size 5096403 diff --git a/web-llm-models/v0_2_80/Qwen3-8B-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-8B-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index a2b02904dc3fa59b61767138604b1e5d1683d875..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen3-8B-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:cb5c0b053def967400622d893b438bdf62e74d16e6bd97aabb3c71ca5fefa850 -size 5249209 diff --git a/web-llm-models/v0_2_80/Qwen3-8B-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/Qwen3-8B-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 118a95a37f2d31e99c63508f16b11aadc2e55391..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/Qwen3-8B-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4475d9accb042f807b4f5004584ebbca9abf5659c8ce7b2b4edd01e031347381 -size 5100016 diff --git a/web-llm-models/v0_2_80/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k_cs1k-webgpu.wasm deleted file mode 100644 index a0393d4ffa2a727ef06bf7c87a8de8db986f1156..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/RedPajama-INCITE-Chat-3B-v1-q4f16_1-ctx2k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2ac8742d3ebfe8d73dee65b7f9ad028b9b3684429f372aee08498474a05f9e24 -size 4913981 diff --git a/web-llm-models/v0_2_80/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k_cs1k-webgpu.wasm deleted file mode 100644 index 0b833b5299170f4428a92f0a617b44fc186678af..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/RedPajama-INCITE-Chat-3B-v1-q4f32_1-ctx2k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0cff4ac94d9a1b51bda503f762b5fa1c1307ee851a1e5fdb8aadd7e225bc8e8f -size 4867021 diff --git a/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index abe7da82a2d01a3853aa1823774323e92722cc62..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:29b4280a39df222869a5a19ed5ea3400742243048b643c3e621df4aab04b07d3 -size 4737987 diff --git a/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index e5b8fe5dd1fccf9a0f1a62ff80ed8f57ec8bb85f..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b6fc09134d32e16a47fd117eb6411c99488806a0bbf881874d58e5ff00dd5290 -size 5026864 diff --git a/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 07b991ce2c32ed3f915364f6633d02db5891f64d..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/SmolLM2-1.7B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4bd275e0055d9f21be53dfb443dbcf7444b9d8d9d39eea1f5b96377c007bcc68 -size 4869922 diff --git a/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index c2b599d9b95abd037baabf5596b14e0448aeb7cb..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4b3c6f201de25b20301562dd571fc8f2b859596df09a1b29535d0fe04702c322 -size 4703557 diff --git a/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index e8b5fd70fddb14624aabef58b38893421ee26ab8..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e792ea4dd15eb352775224490f31229ab805cd3f768cba339473d339ac916ef1 -size 4674751 diff --git a/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 0766454192b18b12be734a64e1b3d4fd903f9d82..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:02e3b4da928bcbc051335cbbac501e40eaae1cb4f2a4ab196cb1fffcceee3aa7 -size 5023498 diff --git a/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 506d7236417d93d71532ba35d34294430c6abe4e..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/SmolLM2-135M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2892b3f4fd2fa672b3568a4995124c4331989e2f8d985af26071e3b34ee82801 -size 4994608 diff --git a/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index b5cf1aa3cea574275758ffd116ed8cb1fb2cf4a2..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q0f16-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8a0f50bebcd5b9b55d569cd9f605bc197e9a5e899ef80529dda705cc446541fe -size 4825417 diff --git a/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 06623902922ab5070db82858f9bb70a936082904..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q0f32-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:75c5602d923eea8b6d4e19d65d0f5f932129a8b1ed2f1367d75f64f64ba580ea -size 4796086 diff --git a/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index c577792264f2f1e7a28533ca0c1630ae510d9f00..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d07d1bb06ce2455da8a2aab9bce9a746cb56ed4177611a7a33141cae4b422a79 -size 5056973 diff --git a/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 00f204362feaa3a3257879116ec3f4f827a4b36b..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/SmolLM2-360M-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:09434111064e168afc361d34925cbc776b108fa92d09b602f78517f417335804 -size 5027616 diff --git a/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k_cs1k-webgpu.wasm deleted file mode 100644 index beb8f7085fe8454de22c68617d5392cb0a16be74..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q0f16-ctx2k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9c075fd75e08b580a80d44ca63f45f0c9fc67313c25afdeff9e002901a141d0b -size 4665014 diff --git a/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k_cs1k-webgpu.wasm deleted file mode 100644 index 88dca71ad6f7b41c232edc1af3846e5daf517278..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q0f32-ctx2k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:78b9f19791b15bd7a9bf5da45338b91ee8c9025e2e0092a5d96f4f1ef9234724 -size 4533418 diff --git a/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx2k_cs1k-webgpu.wasm deleted file mode 100644 index d14c055b6476d44a15d895de28082b511c89f6b2..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q4f16_1-ctx2k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ef51c2e76fc1bb5e055edf961b84af026f6626d13533eb13a914e6a1e640c970 -size 4938116 diff --git a/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx2k_cs1k-webgpu.wasm deleted file mode 100644 index 1104b4fcc6f2305612ae040678adb6c4e8fe0504..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v0.4-q4f32_1-ctx2k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a008cfbc8aea6047638edd32330c29e17eaf436c316e64c66050d85831f5074a -size 4791630 diff --git a/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v1.0-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v1.0-q4f16_1-ctx2k_cs1k-webgpu.wasm deleted file mode 100644 index d14c055b6476d44a15d895de28082b511c89f6b2..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v1.0-q4f16_1-ctx2k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ef51c2e76fc1bb5e055edf961b84af026f6626d13533eb13a914e6a1e640c970 -size 4938116 diff --git a/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v1.0-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v1.0-q4f32_1-ctx2k_cs1k-webgpu.wasm deleted file mode 100644 index 1104b4fcc6f2305612ae040678adb6c4e8fe0504..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/TinyLlama-1.1B-Chat-v1.0-q4f32_1-ctx2k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a008cfbc8aea6047638edd32330c29e17eaf436c316e64c66050d85831f5074a -size 4791630 diff --git a/web-llm-models/v0_2_80/compile_wasm.py b/web-llm-models/v0_2_80/compile_wasm.py deleted file mode 100644 index 0467c01d9b2d7c9916a00e5f2dc598e3534b045b..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/compile_wasm.py +++ /dev/null @@ -1,274 +0,0 @@ -import os -import subprocess -import sys -from pathlib import Path - -LOG_PATH = Path("./") / "compile_wasm_log.txt" -# NOTE(Harry): Set this to your binary-mlc-llm-libs repo. -BINARY_DIR = "/path/to/binary-mlc-llm-libs/web-llm-models/v0_2_80" - -# -1. Clean log file -cmd = [ - "rm", - "-rf", - "./compile_wasm_log.txt", -] -print(" ".join(cmd), flush=True) -subprocess.run(cmd, check=True, stderr=subprocess.STDOUT, env=os.environ) - - -def compile( - model, - quantization, - context_window_size, - prefill_chunk_size, - model_id, - use_sliding_window=False, - max_batch_size=None, -): - with LOG_PATH.open("a", encoding="utf-8") as log_file: - # 0. Clean temp folder - cmd = [ - "rm", - "-rf", - "dist/temp/", - ] - print(" ".join(cmd), flush=True) - subprocess.run(cmd, check=True, stdout=log_file, stderr=subprocess.STDOUT, env=os.environ) - - # 1. Gen config - cmd = [ - sys.executable, - "-m", - "mlc_llm", - "gen_config", - model, - "--output", - "dist/temp", - "--conv-template", - "LM", - "--quantization", - quantization, - "--prefill-chunk-size", - str(prefill_chunk_size), - ] - if use_sliding_window: - cmd += [ - "--sliding-window-size", - str(context_window_size), - ] - else: - cmd += [ - "--context-window-size", - str(context_window_size), - ] - if max_batch_size: - cmd += [ - "--max-batch-size", - str(max_batch_size), - ] - print(" ".join(cmd), flush=True) - subprocess.run(cmd, check=True, stdout=log_file, stderr=subprocess.STDOUT, env=os.environ) - - # 2. compile - - # 2.1. Get output wasm name - ctx = "" - if context_window_size == 4096: - ctx = "4k" - elif context_window_size == 2048: - ctx = "2k" - elif context_window_size == 1024: - ctx = "1k" - elif context_window_size == 512: - ctx = "512" - else: - raise RuntimeError(f"Unrecognized ctx: {ctx}") - - cs = "" - if prefill_chunk_size == 4096: - cs = "4k" - elif prefill_chunk_size == 2048: - cs = "2k" - elif prefill_chunk_size == 1024: - cs = "1k" - elif prefill_chunk_size == 512: - cs = "512" - else: - raise RuntimeError(f"Unrecognized cs: {cs}") - - # e.g. Llama-3-8B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm - if use_sliding_window: - output_file_name = f"{model_id}-{quantization}-sw{ctx}_cs{cs}" - else: - output_file_name = f"{model_id}-{quantization}-ctx{ctx}_cs{cs}" - if max_batch_size: - output_file_name += f"_batch{max_batch_size}" - output_file_name += "-webgpu.wasm" - output_path = os.path.join(BINARY_DIR, output_file_name) - - # 2.2. Compile - cmd = [ - sys.executable, - "-m", - "mlc_llm", - "compile", - "dist/temp/mlc-chat-config.json", - "--device", - "webgpu", - "--output", - output_path, - ] - print(" ".join(cmd), flush=True) - subprocess.run(cmd, check=True, stdout=log_file, stderr=subprocess.STDOUT, env=os.environ) - - # 3. Clean temp mlc-chat-config.json - cmd = [ - "rm", - "-rf", - "dist/temp/mlc-chat-config.json", - ] - print(" ".join(cmd), flush=True) - subprocess.run(cmd, check=True, stdout=log_file, stderr=subprocess.STDOUT, env=os.environ) - - -# NOTE(Charlie): As of 03/31/2025, the context window size does not do anything because -# it has become a runtime thing in both MLC-LLM and WebLLM. - -# NOTE(Harry): To compile a wasm, uncomment the corresponding line below. - -# compile("phi-3", "q4f16_1", 4096, 1024, "Phi-3-mini-4k-instruct") -# compile("phi-3", "q4f16_1", 4096, 1024, "Phi-3-mini-4k-instruct-old") -# compile("phi-3", "q4f32_1", 4096, 1024, "Phi-3-mini-4k-instruct") - -# compile("llama3_8b", "q4f16_1", 4096, 1024, "Llama-3-8B-Instruct") -# compile("llama3_8b", "q4f32_1", 4096, 1024, "Llama-3-8B-Instruct") - -# compile("llama2_7b", "q4f16_1", 4096, 1024, "Llama-2-7b-chat-hf") -# compile("llama2_7b", "q4f32_1", 4096, 1024, "Llama-2-7b-chat-hf") - -# compile("llama2_13b", "q4f16_1", 4096, 1024, "Llama-2-13b-chat-hf") - -# compile("mistral_7b_v03", "q4f16_1", 4096, 1024, "Mistral-7B-Instruct-v0.3") -# compile("mistral_7b_v03", "q4f32_1", 4096, 1024, "Mistral-7B-Instruct-v0.3") - -# compile("redpajama_3b_v1", "q4f16_1", 2048, 1024, "RedPajama-INCITE-Chat-3B-v1") -# compile("redpajama_3b_v1", "q4f32_1", 2048, 1024, "RedPajama-INCITE-Chat-3B-v1") - -# compile("tinyllama_1b_chat_v0.4", "q0f16", 2048, 1024, "TinyLlama-1.1B-Chat-v0.4") -# compile("tinyllama_1b_chat_v0.4", "q0f32", 2048, 1024, "TinyLlama-1.1B-Chat-v0.4") -# compile("tinyllama_1b_chat_v0.4", "q4f16_1", 2048, 1024, "TinyLlama-1.1B-Chat-v0.4") -# compile("tinyllama_1b_chat_v0.4", "q4f32_1", 2048, 1024, "TinyLlama-1.1B-Chat-v0.4") - -# compile("tinyllama_1b_chat_v1.0", "q4f16_1", 2048, 1024, "TinyLlama-1.1B-Chat-v1.0") -# compile("tinyllama_1b_chat_v1.0", "q4f32_1", 2048, 1024, "TinyLlama-1.1B-Chat-v1.0") - -# compile("gemma_2b", "q4f16_1", 4096, 1024, "gemma-2b-it") -# compile("gemma_2b", "q4f32_1", 4096, 1024, "gemma-2b-it") - -# compile("gpt2_medium", "q0f16", 1024, 1024, "gpt2-medium") -# compile("gpt2", "q0f16", 1024, 1024, "gpt2") - -# compile("phi-1_5", "q4f16_1", 2048, 1024, "phi-1_5") -# compile("phi-1_5", "q4f32_1", 2048, 1024, "phi-1_5") - -# compile("phi-2", "q4f16_1", 2048, 1024, "phi-2") -# compile("phi-2", "q4f32_1", 2048, 1024, "phi-2") - -# compile("stablelm-2-zephyr-1_6b", "q4f16_1", 4096, 1024, "stablelm-2-zephyr-1_6b") -# compile("stablelm-2-zephyr-1_6b", "q4f32_1", 4096, 1024, "stablelm-2-zephyr-1_6b") - -# compile("qwen2_0_5b", "q4f16_1", 4096, 1024, "Qwen2-0.5B-Instruct") -# compile("qwen2_0_5b", "q4f32_1", 4096, 1024, "Qwen2-0.5B-Instruct") -# compile("qwen2_0_5b", "q0f16", 4096, 1024, "Qwen2-0.5B-Instruct") -# compile("qwen2_0_5b", "q0f32", 4096, 1024, "Qwen2-0.5B-Instruct") - -# compile("qwen2_1_5b", "q4f16_1", 4096, 1024, "Qwen2-1.5B-Instruct") -# compile("qwen2_1_5b", "q4f32_1", 4096, 1024, "Qwen2-1.5B-Instruct") - -# compile("qwen2.5_3b", "q4f16_1", 4096, 1024, "Qwen2.5-3B-Instruct") -# compile("qwen2.5_3b", "q4f32_1", 4096, 1024, "Qwen2.5-3B-Instruct") - -# compile("qwen2_7b", "q4f16_1", 4096, 1024, "Qwen2-7B-Instruct") -# compile("qwen2_7b", "q4f32_1", 4096, 1024, "Qwen2-7B-Instruct") - -# compile("llama3_70b", "q3f16_1", 4096, 1024, "Llama-3-70B-Instruct") - -# compile("llama3_1_8b", "q4f16_1", 4096, 1024, "Llama-3_1-8B-Instruct") -# compile("llama3_1_8b", "q4f32_1", 4096, 1024, "Llama-3_1-8B-Instruct") - -# compile("llama3_1_70b", "q3f16_1", 4096, 1024, "Llama-3_1-70B-Instruct") - -# compile("gemma2_2b", "q4f16_1", 4096, 1024, "gemma-2-2b-it") -# compile("gemma2_2b", "q4f32_1", 4096, 1024, "gemma-2-2b-it") - -# compile("gemma2_9b", "q4f16_1", 4096, 1024, "gemma-2-9b-it") -# compile("gemma2_9b", "q4f32_1", 4096, 1024, "gemma-2-9b-it") - -# # max_position_embeddings is set to be 512 here for embedding model; no rope is used -# compile( -# "snowflake-arctic-embed-m", "q0f32", 512, 512, "snowflake-arctic-embed-m", max_batch_size=32 -# ) -# compile("snowflake-arctic-embed-m", "q0f32", 512, 512, "snowflake-arctic-embed-m", max_batch_size=4) - -# compile( -# "snowflake-arctic-embed-s", "q0f32", 512, 512, "snowflake-arctic-embed-s", max_batch_size=32 -# ) -# compile("snowflake-arctic-embed-s", "q0f32", 512, 512, "snowflake-arctic-embed-s", max_batch_size=4) - -# # Cannot be shared with phi-3 because phi3.5 has rope scaling -# compile("phi-3_5", "q4f16_1", 4096, 1024, "Phi-3.5-mini-instruct") -# compile("phi-3_5", "q4f32_1", 4096, 1024, "Phi-3.5-mini-instruct") - -# compile("phi-3_5-vision", "q4f16_1", 4096, 2048, "Phi-3.5-vision-instruct") -# compile("phi-3_5-vision", "q4f32_1", 4096, 2048, "Phi-3.5-vision-instruct") - -# # Llama3.2 1B/3B -# compile("llama3_2_1b", "q0f16", 4096, 1024, "Llama-3.2-1B-Instruct") -# compile("llama3_2_1b", "q0f32", 4096, 1024, "Llama-3.2-1B-Instruct") -# compile("llama3_2_1b", "q4f16_1", 4096, 1024, "Llama-3.2-1B-Instruct") -# compile("llama3_2_1b", "q4f32_1", 4096, 1024, "Llama-3.2-1B-Instruct") - -# compile("llama3_2_3b", "q4f16_1", 4096, 1024, "Llama-3.2-3B-Instruct") -# compile("llama3_2_3b", "q4f32_1", 4096, 1024, "Llama-3.2-3B-Instruct") - -# compile("gemma2_2b-jpn", "q4f16_1", 4096, 1024, "gemma-2-2b-jpn-it") -# compile("gemma2_2b-jpn", "q4f32_1", 4096, 1024, "gemma-2-2b-jpn-it") - -# compile("smollm2_1_7b", "q0f16", 4096, 1024, "SmolLM2-1.7B-Instruct") -# compile("smollm2_1_7b", "q4f16_1", 4096, 1024, "SmolLM2-1.7B-Instruct") -# compile("smollm2_1_7b", "q4f32_1", 4096, 1024, "SmolLM2-1.7B-Instruct") - -# compile("smollm2_360m", "q0f16", 4096, 1024, "SmolLM2-360M-Instruct") -# compile("smollm2_360m", "q0f32", 4096, 1024, "SmolLM2-360M-Instruct") -# compile("smollm2_360m", "q4f16_1", 4096, 1024, "SmolLM2-360M-Instruct") -# compile("smollm2_360m", "q4f32_1", 4096, 1024, "SmolLM2-360M-Instruct") - -# compile("smollm2_135m", "q0f16", 4096, 1024, "SmolLM2-135M-Instruct") -# compile("smollm2_135m", "q0f32", 4096, 1024, "SmolLM2-135M-Instruct") -# compile("smollm2_135m", "q4f16_1", 4096, 1024, "SmolLM2-135M-Instruct") -# compile("smollm2_135m", "q4f32_1", 4096, 1024, "SmolLM2-135M-Instruct") - -# compile("gemma3_1b_it", "q4f16_1", 4096, 1024, "gemma3-1b-it") - - -# compile("qwen3_0.6b", "q4f16_1", 4096, 1024, "Qwen3-0.6B") -# compile("qwen3_0.6b", "q4f32_1", 4096, 1024, "Qwen3-0.6B") -# compile("qwen3_0.6b", "q0f16", 4096, 1024, "Qwen3-0.6B") -# compile("qwen3_0.6b", "q0f32", 4096, 1024, "Qwen3-0.6B") - -# compile("qwen3_1.7b", "q4f16_1", 4096, 1024, "Qwen3-1.7B") -# compile("qwen3_1.7b", "q4f32_1", 4096, 1024, "Qwen3-1.7B") - -# compile("qwen3_4b", "q4f16_1", 4096, 1024, "Qwen3-4B") -# compile("qwen3_4b", "q4f32_1", 4096, 1024, "Qwen3-4B") - -# compile("qwen3_8b", "q4f16_1", 4096, 1024, "Qwen3-8B") -# compile("qwen3_8b", "q4f32_1", 4096, 1024, "Qwen3-8B") - -# compile("qwen3_4b_instruct_2507", "q4f16_1", 4096, 1024, "Qwen3-4B-Instruct-2507") -# compile("qwen3_4b_instruct_2507", "q4f32_1", 4096, 1024, "Qwen3-4B-Instruct-2507") - -# compile("qwen3_4b_thinking_2507", "q4f16_1", 4096, 1024, "Qwen3-4B-Thinking-2507") -compile("qwen3_4b_thinking_2507", "q4f32_1", 4096, 1024, "Qwen3-4B-Thinking-2507") - diff --git a/web-llm-models/v0_2_80/gemma-2-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma-2-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 89b9caf43d1d0aafc3204d7998fbbd5de879f820..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/gemma-2-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1faaa2251812567475a76fe86fb1bbf29a7c3db4ae73b18773060bf2d7c6e8d7 -size 4530799 diff --git a/web-llm-models/v0_2_80/gemma-2-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma-2-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index da95614b1aec2a5b686b5b43ce70c5c83c1a8657..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/gemma-2-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7e8cfd32246359bb0c349017b6cdfa5ba863288863dd24318ee74fafa2e37430 -size 4503112 diff --git a/web-llm-models/v0_2_80/gemma-2-2b-jpn-it-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma-2-2b-jpn-it-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 89b9caf43d1d0aafc3204d7998fbbd5de879f820..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/gemma-2-2b-jpn-it-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1faaa2251812567475a76fe86fb1bbf29a7c3db4ae73b18773060bf2d7c6e8d7 -size 4530799 diff --git a/web-llm-models/v0_2_80/gemma-2-2b-jpn-it-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma-2-2b-jpn-it-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index da95614b1aec2a5b686b5b43ce70c5c83c1a8657..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/gemma-2-2b-jpn-it-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7e8cfd32246359bb0c349017b6cdfa5ba863288863dd24318ee74fafa2e37430 -size 4503112 diff --git a/web-llm-models/v0_2_80/gemma-2-9b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma-2-9b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index e57ef5d5cb810bc91700f1242030024e7ba84fc8..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/gemma-2-9b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ecf510613e41d66b91d2001ba55be48a36d7c79f806b670cf3fb4bf48f1af50f -size 5087840 diff --git a/web-llm-models/v0_2_80/gemma-2-9b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma-2-9b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 2842d8fc36536ab4c1d7ce88a5f5dd61b704ca0d..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/gemma-2-9b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4c4b04789f1e73394140005637846aac8f4d8db3010cd29d13a1aa560c971adc -size 5041859 diff --git a/web-llm-models/v0_2_80/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index a56e9a1ec8a8e3638f1e7e0e9641d629d6e1a0eb..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/gemma-2b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7de56bb71bf51bf6924e88fea7e616ce1d59c52f9c40fcdc0dcd19f5ee5a501e -size 4235746 diff --git a/web-llm-models/v0_2_80/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index e2b77423084bd088af9cc75ef906934b6603639a..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/gemma-2b-it-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4560a713fb1636b5ad1a380b6e1543d3dca6eadecd461d0c80287d2fddc7953c -size 4168998 diff --git a/web-llm-models/v0_2_80/gemma3-1b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gemma3-1b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 080b606b9782ee46dd7f620fb4f3a8821a0df39b..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/gemma3-1b-it-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:630fdbd726367dc647123fbc4d7dd473e7daed1c382eaa7b42ff769dbca0711a -size 5053215 diff --git a/web-llm-models/v0_2_80/gpt2-medium-q0f16-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gpt2-medium-q0f16-ctx1k_cs1k-webgpu.wasm deleted file mode 100644 index b128e5c058f72741812079f7170cd62804084dbd..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/gpt2-medium-q0f16-ctx1k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e7f3fefc38d266d7f27a241f8386194dcbd4103b90eb990992af4d7efa8296a8 -size 4448319 diff --git a/web-llm-models/v0_2_80/gpt2-q0f16-ctx1k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/gpt2-q0f16-ctx1k_cs1k-webgpu.wasm deleted file mode 100644 index ee9df8cbec755f76d261ad8068dfa65e04d3c8ef..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/gpt2-q0f16-ctx1k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1c9bfa66e6e9c9ee05a1da41169ff35f38faecc8eae1d29e3a5a4b2bab30fadd -size 4079567 diff --git a/web-llm-models/v0_2_80/phi-1_5-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/phi-1_5-q4f16_1-ctx2k_cs1k-webgpu.wasm deleted file mode 100644 index 948ffbde16635619fb67bfea9f99b730cfd789c1..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/phi-1_5-q4f16_1-ctx2k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9d1b75ac4dc594574830f45ca223e6d60123f57476a83f5645ca07aaaaa9d8b1 -size 4535905 diff --git a/web-llm-models/v0_2_80/phi-1_5-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/phi-1_5-q4f32_1-ctx2k_cs1k-webgpu.wasm deleted file mode 100644 index 3eeb5a5712babd0be70e3fda26d5c7c5951aaef2..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/phi-1_5-q4f32_1-ctx2k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f4e3b77c6453c538307d8d9290e4758d4c9844a61289c2df197fc74370601cf4 -size 4508100 diff --git a/web-llm-models/v0_2_80/phi-2-q4f16_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/phi-2-q4f16_1-ctx2k_cs1k-webgpu.wasm deleted file mode 100644 index cbbb2846cf8a00b2e2853c45e7e692ccb19622a9..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/phi-2-q4f16_1-ctx2k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:36cbeaa3ea894f475ce0a475e7cff16c2eeb964e9fcc96414ea82037c48eb54b -size 4711307 diff --git a/web-llm-models/v0_2_80/phi-2-q4f32_1-ctx2k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/phi-2-q4f32_1-ctx2k_cs1k-webgpu.wasm deleted file mode 100644 index 4090e8274f3074ae568594dee58e47cfe5d1b6ea..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/phi-2-q4f32_1-ctx2k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2bf59b4b4ae4d9ccbdf965f16fcf60dc88d238051def52ce50a0d3c379659c7d -size 4679325 diff --git a/web-llm-models/v0_2_80/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch32-webgpu.wasm b/web-llm-models/v0_2_80/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch32-webgpu.wasm deleted file mode 100644 index 4a131373f1440e6b556cc68ec887c7a35d6bd41d..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch32-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a10a121186127774bcf6b6e2dcbcf9dc503c485dbbc3c3e7fb4153e457f81440 -size 2720636 diff --git a/web-llm-models/v0_2_80/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch4-webgpu.wasm b/web-llm-models/v0_2_80/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch4-webgpu.wasm deleted file mode 100644 index b686fa47cb8c5f726e399fcb0c24b8de58c8ab15..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/snowflake-arctic-embed-m-q0f32-ctx512_cs512_batch4-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fa8163e4fa1e318f357a276b8dd7b71dde2705165e2aeb89a6b5700dd22ca0c3 -size 2720639 diff --git a/web-llm-models/v0_2_80/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch32-webgpu.wasm b/web-llm-models/v0_2_80/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch32-webgpu.wasm deleted file mode 100644 index 79cb64ee9291b4159264628484bed9b0f9fde821..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch32-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a89478988d0ed16fdfade9517d7d8c69ed5aac671b3891ac9e329c64fb5a8d6b -size 2703661 diff --git a/web-llm-models/v0_2_80/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch4-webgpu.wasm b/web-llm-models/v0_2_80/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch4-webgpu.wasm deleted file mode 100644 index d5493526e986cfcb5019a262ab7dd67e8105e707..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/snowflake-arctic-embed-s-q0f32-ctx512_cs512_batch4-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:01afbc716fa17614533fefbb5ca3f20f5a9223be48ac10bf222e08ad2aece378 -size 2703663 diff --git a/web-llm-models/v0_2_80/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index 0782654bdc225b6b38367496dffe95d7d7463b85..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/stablelm-2-zephyr-1_6b-q4f16_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bc062e1865559bcd2a56a748dfae32a4ae9198ec2442eda52de50dd763676b32 -size 4510137 diff --git a/web-llm-models/v0_2_80/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm b/web-llm-models/v0_2_80/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm deleted file mode 100644 index cdc5513109ba7de100e1a183c2d1a6c410712c6f..0000000000000000000000000000000000000000 --- a/web-llm-models/v0_2_80/stablelm-2-zephyr-1_6b-q4f32_1-ctx4k_cs1k-webgpu.wasm +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:be81bd086647b1bce7174dc5ea775601bbd4b9cba75aac48cb4ea09a05096a04 -size 4480826