diff --git a/README.md b/README.md index 3eafda35bba756999dd05742cb7754953f91779c..2a91db54cd6048b3868cc7774218e80cc687cc20 100644 --- a/README.md +++ b/README.md @@ -35,50 +35,18 @@ More details on model performance across various devices, can be found | Model | Precision | Device | Chipset | Target Runtime | Inference Time (ms) | Peak Memory Range (MB) | Primary Compute Unit | Target Model |---|---|---|---|---|---|---|---|---| -| WhisperSmallEncoderQuantizable | w8a16 | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_CONTEXT_BINARY | 128.052 ms | 1 - 10 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | QNN_CONTEXT_BINARY | 112.608 ms | 1 - 21 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_CONTEXT_BINARY | 62.325 ms | 1 - 3 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | PRECOMPILED_QNN_ONNX | 62.524 ms | 0 - 115 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_CONTEXT_BINARY | 58.95 ms | 1 - 10 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | RB3 Gen 2 (Proxy) | Qualcomm® QCS6490 (Proxy) | QNN_CONTEXT_BINARY | 613.165 ms | 1 - 13 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | RB3 Gen 2 (Proxy) | Qualcomm® QCS6490 (Proxy) | PRECOMPILED_QNN_ONNX | 612.722 ms | 29 - 40 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | SA7255P ADP | Qualcomm® SA7255P | QNN_CONTEXT_BINARY | 128.052 ms | 1 - 10 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_CONTEXT_BINARY | 61.478 ms | 0 - 3 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | SA8295P ADP | Qualcomm® SA8295P | QNN_CONTEXT_BINARY | 80.04 ms | 1 - 17 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_CONTEXT_BINARY | 62.303 ms | 1 - 3 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | SA8775P ADP | Qualcomm® SA8775P | QNN_CONTEXT_BINARY | 58.95 ms | 1 - 10 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_CONTEXT_BINARY | 43.635 ms | 1 - 19 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | PRECOMPILED_QNN_ONNX | 44.395 ms | 56 - 75 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Samsung Galaxy S25 | Snapdragon® 8 Elite For Galaxy Mobile | QNN_CONTEXT_BINARY | 35.072 ms | 1 - 14 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Samsung Galaxy S25 | Snapdragon® 8 Elite For Galaxy Mobile | PRECOMPILED_QNN_ONNX | 36.148 ms | 54 - 67 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon 7 Gen 5 QRD | Snapdragon® 7 Gen 5 Mobile | QNN_CONTEXT_BINARY | 191.005 ms | 1 - 15 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon 7 Gen 5 QRD | Snapdragon® 7 Gen 5 Mobile | PRECOMPILED_QNN_ONNX | 184.911 ms | 54 - 63 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon 8 Elite Gen 5 QRD | Snapdragon® 8 Elite Gen5 Mobile | QNN_CONTEXT_BINARY | 28.292 ms | 0 - 12 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon 8 Elite Gen 5 QRD | Snapdragon® 8 Elite Gen5 Mobile | PRECOMPILED_QNN_ONNX | 28.678 ms | 61 - 72 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_CONTEXT_BINARY | 61.61 ms | 0 - 0 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | PRECOMPILED_QNN_ONNX | 61.896 ms | 108 - 108 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_CONTEXT_BINARY | 13.422 ms | 27 - 36 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | QNN_CONTEXT_BINARY | 11.469 ms | 29 - 46 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_CONTEXT_BINARY | 8.49 ms | 30 - 33 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | PRECOMPILED_QNN_ONNX | 8.83 ms | 30 - 32 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_CONTEXT_BINARY | 9.441 ms | 24 - 34 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | RB3 Gen 2 (Proxy) | Qualcomm® QCS6490 (Proxy) | QNN_CONTEXT_BINARY | 32.888 ms | 27 - 38 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | RB3 Gen 2 (Proxy) | Qualcomm® QCS6490 (Proxy) | PRECOMPILED_QNN_ONNX | 34.862 ms | 37 - 49 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | SA7255P ADP | Qualcomm® SA7255P | QNN_CONTEXT_BINARY | 13.422 ms | 27 - 36 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_CONTEXT_BINARY | 8.26 ms | 35 - 37 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | SA8295P ADP | Qualcomm® SA8295P | QNN_CONTEXT_BINARY | 10.538 ms | 30 - 46 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_CONTEXT_BINARY | 8.403 ms | 26 - 28 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | SA8775P ADP | Qualcomm® SA8775P | QNN_CONTEXT_BINARY | 9.441 ms | 24 - 34 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_CONTEXT_BINARY | 6.394 ms | 30 - 48 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | PRECOMPILED_QNN_ONNX | 6.854 ms | 38 - 57 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Samsung Galaxy S25 | Snapdragon® 8 Elite For Galaxy Mobile | QNN_CONTEXT_BINARY | 4.825 ms | 28 - 42 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Samsung Galaxy S25 | Snapdragon® 8 Elite For Galaxy Mobile | PRECOMPILED_QNN_ONNX | 5.182 ms | 26 - 42 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon 7 Gen 5 QRD | Snapdragon® 7 Gen 5 Mobile | QNN_CONTEXT_BINARY | 11.331 ms | 30 - 45 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon 7 Gen 5 QRD | Snapdragon® 7 Gen 5 Mobile | PRECOMPILED_QNN_ONNX | 11.918 ms | 38 - 50 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon 8 Elite Gen 5 QRD | Snapdragon® 8 Elite Gen5 Mobile | QNN_CONTEXT_BINARY | 4.047 ms | 28 - 40 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon 8 Elite Gen 5 QRD | Snapdragon® 8 Elite Gen5 Mobile | PRECOMPILED_QNN_ONNX | 4.395 ms | 37 - 48 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_CONTEXT_BINARY | 7.733 ms | 30 - 30 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | PRECOMPILED_QNN_ONNX | 7.756 ms | 186 - 186 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | PRECOMPILED_QNN_ONNX | 62.444 ms | 0 - 113 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | RB3 Gen 2 (Proxy) | Qualcomm® QCS6490 (Proxy) | PRECOMPILED_QNN_ONNX | 612.628 ms | 52 - 63 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | PRECOMPILED_QNN_ONNX | 45.312 ms | 56 - 75 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | Samsung Galaxy S25 | Snapdragon® 8 Elite For Galaxy Mobile | PRECOMPILED_QNN_ONNX | 35.236 ms | 63 - 78 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon 8 Elite Gen 5 QRD | Snapdragon® 8 Elite Gen5 Mobile | PRECOMPILED_QNN_ONNX | 30.325 ms | 61 - 72 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | PRECOMPILED_QNN_ONNX | 61.693 ms | 107 - 107 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | PRECOMPILED_QNN_ONNX | 8.647 ms | 0 - 192 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | RB3 Gen 2 (Proxy) | Qualcomm® QCS6490 (Proxy) | PRECOMPILED_QNN_ONNX | 33.594 ms | 37 - 49 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | PRECOMPILED_QNN_ONNX | 6.715 ms | 38 - 56 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | Samsung Galaxy S25 | Snapdragon® 8 Elite For Galaxy Mobile | PRECOMPILED_QNN_ONNX | 5.136 ms | 27 - 42 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon 8 Elite Gen 5 QRD | Snapdragon® 8 Elite Gen5 Mobile | PRECOMPILED_QNN_ONNX | 4.357 ms | 38 - 48 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | PRECOMPILED_QNN_ONNX | 7.792 ms | 185 - 185 MB | NPU | Use Export Script | diff --git a/precompiled/qualcomm-qcs6490-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcs6490-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin deleted file mode 100644 index 530d6073d38e527d0ffd86ce03b46f63e4f25cf1..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-qcs6490-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ddc997b35f6ed3a6791734bc03a0fbeaf0edfd423dfa1c306a5863f8f9eab57a -size 223879168 diff --git a/precompiled/qualcomm-qcs6490-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-qcs6490-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip index 06e6e26e7aeec639e4c6adbd9555b9e9940459cf..24f0014f8939f34b08f62c2f759a34213e85ad99 100644 --- a/precompiled/qualcomm-qcs6490-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-qcs6490-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a6910473b32f3f42e074b7effa5d7f90a46b3604e3772bd801cc1a72bf9019fe -size 193518242 +oid sha256:721564bbd831d19ff49da30758f26e915ce7c3c0476fd54e6499978dd418eb2c +size 193518243 diff --git a/precompiled/qualcomm-qcs6490-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcs6490-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin deleted file mode 100644 index 047975c44e4e5d74cbb65ccc926b73fbb75bb51b..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-qcs6490-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:14a567f9876799271f59773500e1abae07d5acd12f189cb39641d7c1b2fcf5c0 -size 139366400 diff --git a/precompiled/qualcomm-qcs6490-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-qcs6490-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip index 87c90fa340f095864925a78fd974df902cc46d94..435d1b90f39929bc420ab1d38d68a18b247fd3b2 100644 --- a/precompiled/qualcomm-qcs6490-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-qcs6490-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4f1f1b59bfe33bf27d3f9c71203f3ee359e0f4c99a600a2a44a0ae53063c513b -size 102104980 +oid sha256:3124dd79bfc2734e25871e7c5cb65dda50e4c45b5f24a582dea0de723d22c295 +size 102104982 diff --git a/precompiled/qualcomm-qcs6490-proxy/tool-versions.yaml b/precompiled/qualcomm-qcs6490-proxy/tool-versions.yaml index da45f7a258efe5ac9b94b5f6d444bf650b0dc651..2651df2a5778b3f91e7ee070551106ab67282c06 100644 --- a/precompiled/qualcomm-qcs6490-proxy/tool-versions.yaml +++ b/precompiled/qualcomm-qcs6490-proxy/tool-versions.yaml @@ -1,4 +1,4 @@ tool_versions: precompiled_qnn_onnx: qairt: 2.37.1.250807093845_124904 - onnx_runtime: 1.22.2 + onnx_runtime: 1.23.0 diff --git a/precompiled/qualcomm-qcs8275-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcs8275-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin deleted file mode 100644 index 4d322d4ec033421fea25ecf4cc7040db9829c349..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-qcs8275-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:be9d53a61cd042767ed23fe9a4bd948a55500ec4466241bbe14fd126c916ddff -size 225382400 diff --git a/precompiled/qualcomm-qcs8275-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcs8275-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin deleted file mode 100644 index 2ad842198aaf65e08d6a212a8f4f38c050ddebe4..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-qcs8275-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d0ae251ada265b7ef935120145f582294d148b0cc1f1287fee1f27440bfd27f4 -size 111763456 diff --git a/precompiled/qualcomm-qcs8275-proxy/tool-versions.yaml b/precompiled/qualcomm-qcs8275-proxy/tool-versions.yaml deleted file mode 100644 index edfd7276ba749d5e85820422e59493b95251fdbf..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-qcs8275-proxy/tool-versions.yaml +++ /dev/null @@ -1,3 +0,0 @@ -tool_versions: - qnn_context_binary: - qairt: 2.38.0.250901140452_125126-auto diff --git a/precompiled/qualcomm-qcs8450-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcs8450-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin deleted file mode 100644 index 54e0c725d9d888b08bf5201637c84a6212c402f2..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-qcs8450-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:149d1cc2dd6a5a199dfc87746e35b0bfc2b26f8df17920ad4b550efe45bf8185 -size 223621120 diff --git a/precompiled/qualcomm-qcs8450-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcs8450-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin deleted file mode 100644 index 2ab1d2793b5ab06026968eb685198631ed9fa2ff..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-qcs8450-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e83edc665ecb6441a03f5b9a22bebc74567055dd846608adcb3facbabe24f2c7 -size 111304704 diff --git a/precompiled/qualcomm-qcs8450-proxy/tool-versions.yaml b/precompiled/qualcomm-qcs8450-proxy/tool-versions.yaml deleted file mode 100644 index 651b8e974a8272998a68eb941f388c50bca9eac6..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-qcs8450-proxy/tool-versions.yaml +++ /dev/null @@ -1,3 +0,0 @@ -tool_versions: - qnn_context_binary: - qairt: 2.38.0.250901140452_125126 diff --git a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin deleted file mode 100644 index e9ce9562e85044090551ab17ae59ff6ec80a564c..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:775e604c8aa126be4e8feaad136cf684529419971c54193b82372d0c877f7313 -size 225378304 diff --git a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip index 4bdc8b0799cc8b210917dd3af05828444fa35e22..265fef61bd7a57049d341e33fb4e53f2f5ae64a7 100644 --- a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:942d2ad825c8ee376f6a3afac08aea7cf7a85f4512b01b3cb3f6e75c58d2e329 +oid sha256:0c92fbe0d7ada5b3fc7498821d1f12803a2e043b67a01e4e52a4614a8e11b2f5 size 193590896 diff --git a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin deleted file mode 100644 index 20b9a43527602e8bc9ec6a8f0a47ad915675045b..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e399625ac74cdece9c4215332390ad40f6c95b60fcbf989c0ebbe4d368503c3e -size 112140288 diff --git a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip index 9865fe3038f1a01c328b912029953758501c3e5b..cead4e377e914726ad12d30776f7c84d8b32215f 100644 --- a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c01889fc929c33be789b4f6f7db40890176dc6e350390945b0130420ba7e8d63 +oid sha256:701e9e0c513e880ab484bea2fb8d8e513984c8421ed8e5cf7dbe82de1eaf6e13 size 93996909 diff --git a/precompiled/qualcomm-qcs8550-proxy/tool-versions.yaml b/precompiled/qualcomm-qcs8550-proxy/tool-versions.yaml index da45f7a258efe5ac9b94b5f6d444bf650b0dc651..2651df2a5778b3f91e7ee070551106ab67282c06 100644 --- a/precompiled/qualcomm-qcs8550-proxy/tool-versions.yaml +++ b/precompiled/qualcomm-qcs8550-proxy/tool-versions.yaml @@ -1,4 +1,4 @@ tool_versions: precompiled_qnn_onnx: qairt: 2.37.1.250807093845_124904 - onnx_runtime: 1.22.2 + onnx_runtime: 1.23.0 diff --git a/precompiled/qualcomm-qcs9075-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcs9075-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin deleted file mode 100644 index ba36322e57e2228ca569cfa60345fd89a64b2ac9..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-qcs9075-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:17a87c1210a73669160770d96f6a961d371b47107d7cfe22253a40ce0c2adc40 -size 225386496 diff --git a/precompiled/qualcomm-qcs9075-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcs9075-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin deleted file mode 100644 index 42c4f82859315c2526e6448511f55a5663f976e5..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-qcs9075-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f128bc249bbf1d7c20aefb3fd14d3c756d440c13280db413515821ca83bc77e8 -size 111874048 diff --git a/precompiled/qualcomm-qcs9075-proxy/tool-versions.yaml b/precompiled/qualcomm-qcs9075-proxy/tool-versions.yaml deleted file mode 100644 index edfd7276ba749d5e85820422e59493b95251fdbf..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-qcs9075-proxy/tool-versions.yaml +++ /dev/null @@ -1,3 +0,0 @@ -tool_versions: - qnn_context_binary: - qairt: 2.38.0.250901140452_125126-auto diff --git a/precompiled/qualcomm-sa7255p/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa7255p/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin deleted file mode 100644 index 4d322d4ec033421fea25ecf4cc7040db9829c349..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa7255p/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:be9d53a61cd042767ed23fe9a4bd948a55500ec4466241bbe14fd126c916ddff -size 225382400 diff --git a/precompiled/qualcomm-sa7255p/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa7255p/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin deleted file mode 100644 index 2ad842198aaf65e08d6a212a8f4f38c050ddebe4..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa7255p/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d0ae251ada265b7ef935120145f582294d148b0cc1f1287fee1f27440bfd27f4 -size 111763456 diff --git a/precompiled/qualcomm-sa7255p/tool-versions.yaml b/precompiled/qualcomm-sa7255p/tool-versions.yaml deleted file mode 100644 index edfd7276ba749d5e85820422e59493b95251fdbf..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa7255p/tool-versions.yaml +++ /dev/null @@ -1,3 +0,0 @@ -tool_versions: - qnn_context_binary: - qairt: 2.38.0.250901140452_125126-auto diff --git a/precompiled/qualcomm-sa8255p-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa8255p-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin deleted file mode 100644 index e9ce9562e85044090551ab17ae59ff6ec80a564c..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa8255p-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:775e604c8aa126be4e8feaad136cf684529419971c54193b82372d0c877f7313 -size 225378304 diff --git a/precompiled/qualcomm-sa8255p-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa8255p-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin deleted file mode 100644 index 20b9a43527602e8bc9ec6a8f0a47ad915675045b..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa8255p-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e399625ac74cdece9c4215332390ad40f6c95b60fcbf989c0ebbe4d368503c3e -size 112140288 diff --git a/precompiled/qualcomm-sa8255p-proxy/tool-versions.yaml b/precompiled/qualcomm-sa8255p-proxy/tool-versions.yaml deleted file mode 100644 index 651b8e974a8272998a68eb941f388c50bca9eac6..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa8255p-proxy/tool-versions.yaml +++ /dev/null @@ -1,3 +0,0 @@ -tool_versions: - qnn_context_binary: - qairt: 2.38.0.250901140452_125126 diff --git a/precompiled/qualcomm-sa8295p/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa8295p/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin deleted file mode 100644 index 886c62a263df07ed4aa11e68b9a7e935fdd8c425..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa8295p/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5f06ce724e767be088840f779d8f4eed1ba798f0988f7ef05197274aa2c60ae5 -size 223612928 diff --git a/precompiled/qualcomm-sa8295p/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa8295p/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin deleted file mode 100644 index 8bb441abe6263694c4c7f685916971880c8f4586..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa8295p/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3a001f5170df5123789da48235d533e5ba4cb16ea6ef420a9785b7d19d239a32 -size 111091712 diff --git a/precompiled/qualcomm-sa8295p/tool-versions.yaml b/precompiled/qualcomm-sa8295p/tool-versions.yaml deleted file mode 100644 index edfd7276ba749d5e85820422e59493b95251fdbf..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa8295p/tool-versions.yaml +++ /dev/null @@ -1,3 +0,0 @@ -tool_versions: - qnn_context_binary: - qairt: 2.38.0.250901140452_125126-auto diff --git a/precompiled/qualcomm-sa8650p-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa8650p-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin deleted file mode 100644 index e9ce9562e85044090551ab17ae59ff6ec80a564c..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa8650p-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:775e604c8aa126be4e8feaad136cf684529419971c54193b82372d0c877f7313 -size 225378304 diff --git a/precompiled/qualcomm-sa8650p-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa8650p-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin deleted file mode 100644 index 20b9a43527602e8bc9ec6a8f0a47ad915675045b..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa8650p-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e399625ac74cdece9c4215332390ad40f6c95b60fcbf989c0ebbe4d368503c3e -size 112140288 diff --git a/precompiled/qualcomm-sa8650p-proxy/tool-versions.yaml b/precompiled/qualcomm-sa8650p-proxy/tool-versions.yaml deleted file mode 100644 index 651b8e974a8272998a68eb941f388c50bca9eac6..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa8650p-proxy/tool-versions.yaml +++ /dev/null @@ -1,3 +0,0 @@ -tool_versions: - qnn_context_binary: - qairt: 2.38.0.250901140452_125126 diff --git a/precompiled/qualcomm-sa8775p/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa8775p/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin deleted file mode 100644 index ba36322e57e2228ca569cfa60345fd89a64b2ac9..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa8775p/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:17a87c1210a73669160770d96f6a961d371b47107d7cfe22253a40ce0c2adc40 -size 225386496 diff --git a/precompiled/qualcomm-sa8775p/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa8775p/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin deleted file mode 100644 index 42c4f82859315c2526e6448511f55a5663f976e5..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa8775p/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f128bc249bbf1d7c20aefb3fd14d3c756d440c13280db413515821ca83bc77e8 -size 111874048 diff --git a/precompiled/qualcomm-sa8775p/tool-versions.yaml b/precompiled/qualcomm-sa8775p/tool-versions.yaml deleted file mode 100644 index edfd7276ba749d5e85820422e59493b95251fdbf..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa8775p/tool-versions.yaml +++ /dev/null @@ -1,3 +0,0 @@ -tool_versions: - qnn_context_binary: - qairt: 2.38.0.250901140452_125126-auto diff --git a/precompiled/qualcomm-snapdragon-7gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-7gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin deleted file mode 100644 index b588d77a74e1425c1ba69ea10754adc2a6c0d0ee..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-7gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:10e35e415e36c9fd6892638dc277a7a3dd31743b03c9ab26b3a949b375b84c86 -size 225517568 diff --git a/precompiled/qualcomm-snapdragon-7gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-7gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip deleted file mode 100644 index c5e5811123a1daf548213b531496138f51c47465..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-7gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ce962ea1182d2f6e87cb85db46fb996cbeb5ac2841fd18bebab25eaeefdc3523 -size 193634989 diff --git a/precompiled/qualcomm-snapdragon-7gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-7gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin deleted file mode 100644 index f94367e459b1a0748f3794eebf8d9b4e036f55af..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-7gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1ae81f1b393b7134caf3bbed0d76625fe02feabbc8c51a9ea641a4e97a1dc9f5 -size 147673088 diff --git a/precompiled/qualcomm-snapdragon-7gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-7gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip deleted file mode 100644 index 6a437b49197d495cb6b44e1a2ef5d09d0bf5d507..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-7gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:03c5a1cc569e80d4b25dbbf9d08095b905971e91499702ea8adaf433978bea0c -size 110006845 diff --git a/precompiled/qualcomm-snapdragon-7gen5/tool-versions.yaml b/precompiled/qualcomm-snapdragon-7gen5/tool-versions.yaml deleted file mode 100644 index da45f7a258efe5ac9b94b5f6d444bf650b0dc651..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-7gen5/tool-versions.yaml +++ /dev/null @@ -1,4 +0,0 @@ -tool_versions: - precompiled_qnn_onnx: - qairt: 2.37.1.250807093845_124904 - onnx_runtime: 1.22.2 diff --git a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin deleted file mode 100644 index b5c221045fe060476481ad584909feee3d865606..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:65caf9a1e53521b4bd7e9be7d82438097abc667f6a49febef89f5ac0714234a9 -size 225320960 diff --git a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip index 14ca42e6d2e60142db08a174092b911bfdf51924..a5c6e966c0f619d537e31f1007367b7e86472061 100644 --- a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6d40c060484d09fd330215b13b87141a7a2036a75c63cde8826fd082523f8070 -size 193571496 +oid sha256:7273e24b09e3c471c1e21788ccc1b38795dc37967aa864e94a44c47557b55c0f +size 193571490 diff --git a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin deleted file mode 100644 index a10e39f580dd1eb326914119acdc85b2912ee618..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b70bc389551b60bbf67c1b1368ef692309f00e0ec0c2e9753787e167f79474d5 -size 111689728 diff --git a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip index ee27e2987fb2a8ef0c7fa66b24aa272363ca69b8..a43e56aa96188af571ccd8aa5f8e6cd8cca240fa 100644 --- a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:234842104dc3030650759d7cf3fe5f02cd4d350130079014dfabb8146ec36a52 -size 93686222 +oid sha256:7a7e1a44a4f730857843a58a1fe92eff458462d6a54ae2f0c641914a6d630878 +size 93686218 diff --git a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/tool-versions.yaml b/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/tool-versions.yaml index da45f7a258efe5ac9b94b5f6d444bf650b0dc651..2651df2a5778b3f91e7ee070551106ab67282c06 100644 --- a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/tool-versions.yaml +++ b/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/tool-versions.yaml @@ -1,4 +1,4 @@ tool_versions: precompiled_qnn_onnx: qairt: 2.37.1.250807093845_124904 - onnx_runtime: 1.22.2 + onnx_runtime: 1.23.0 diff --git a/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin deleted file mode 100644 index e6e8aa6bb558057ce3ea1ddfed7808060d6aa1c5..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c484e48f838c5930a8bc5aaa0cb83e9b375ab8078c8bbf68877236c93d6b3902 -size 225484800 diff --git a/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip index 2f9d48d593fe584606aa2f3346eaee85e1a13f17..5c278736fba7f52a0a2a5fb766d199c6b3e6a086 100644 --- a/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7e2952e9582400ad395e5b3a7524481414d8e75191ccced7bd3bd6b60c76082e -size 193623881 +oid sha256:5bdc6ca5660501ab1196792d16ee2b369544776f3b63d4b6b1352e8dcc726d09 +size 193623884 diff --git a/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin deleted file mode 100644 index 80d94069033141959914efcbdf89dac972855424..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ef1bb5b1e010d9d4b2c72457edc793999294cdd804dad1c2a4f7cff94dd570b3 -size 112570368 diff --git a/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip index 9054b0df740716c5735db885682b395b78d391dd..3b3fd0c57b75f2416c81aac3d6216ddd5c61b9ef 100644 --- a/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cc32f3146505fba22c92f7e5a0a4cf1b7de08f91e0c6693aeed473a41aad8bf3 -size 94065502 +oid sha256:0fd02d02ed5433f6dafcb471ff0a4383bcfeeb8a5414630af57683c5dd043c1f +size 94065519 diff --git a/precompiled/qualcomm-snapdragon-8-elite-gen5/tool-versions.yaml b/precompiled/qualcomm-snapdragon-8-elite-gen5/tool-versions.yaml index da45f7a258efe5ac9b94b5f6d444bf650b0dc651..2651df2a5778b3f91e7ee070551106ab67282c06 100644 --- a/precompiled/qualcomm-snapdragon-8-elite-gen5/tool-versions.yaml +++ b/precompiled/qualcomm-snapdragon-8-elite-gen5/tool-versions.yaml @@ -1,4 +1,4 @@ tool_versions: precompiled_qnn_onnx: qairt: 2.37.1.250807093845_124904 - onnx_runtime: 1.22.2 + onnx_runtime: 1.23.0 diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin deleted file mode 100644 index ee21e3dbf34fbe9daeaad20b6c0242c22935ba67..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:de11f65124eddf68a3f121d74051e815c875f13d7b13d4f4aae429edc3c2fb72 -size 225378304 diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip index 18052ceacf4bff875353a097018be27f16d27a35..1a84db21ed8e0cc68b976d53368eb79851a37946 100644 --- a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:997965de328689cbb70b5e0a1937a1d868074df90af03ed96b754bcf29a96762 +oid sha256:930ac9bd8bc475d55a7096eba85a8101a80d31a24c37fd3de8c747ead3d0018a size 193588664 diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin deleted file mode 100644 index ab814e29e24346040340e3da6b5179565002803f..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e13c64ba1420ac8080825085f62c761115f0ff577971162f6e93a6f95966088e -size 111722496 diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip index c87e0cce0a27b12ef937eb36d3fe384fb5cd95b4..a6d16b83e661cb91d7e52f94c2a4e075c6a19788 100644 --- a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e440c4fdd4a00cb780c36de80f943ce0d9fc04ccecc114e30ea0b287cc005275 +oid sha256:028566a7612a8a7d8194cc8512764e888405e982502dd95f39ce977da7efac32 size 93711026 diff --git a/precompiled/qualcomm-snapdragon-8gen3/tool-versions.yaml b/precompiled/qualcomm-snapdragon-8gen3/tool-versions.yaml index da45f7a258efe5ac9b94b5f6d444bf650b0dc651..2651df2a5778b3f91e7ee070551106ab67282c06 100644 --- a/precompiled/qualcomm-snapdragon-8gen3/tool-versions.yaml +++ b/precompiled/qualcomm-snapdragon-8gen3/tool-versions.yaml @@ -1,4 +1,4 @@ tool_versions: precompiled_qnn_onnx: qairt: 2.37.1.250807093845_124904 - onnx_runtime: 1.22.2 + onnx_runtime: 1.23.0 diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin deleted file mode 100644 index d96baf9d23ee82d6858d47aa7bbb016f95e7d886..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:85ba973ec33e6c5bcdb9c6579b7ab572c73df81a39c16b782cf967f0a6d4bb55 -size 225374208 diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip index f6537ec08afb928a2e5720edefbf1f805ef05770..1fcafb9a92afac45ef4c2a6910b9f65b18a40105 100644 --- a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2c4407250aa75d996934a3f241c35605496fda049bd9cc12d5311fc63ffb23c1 +oid sha256:85e6bb2b9ba765af4a2fd57d90375d753df6e8e0fd89faafb21ba1eb06c70398 size 193589978 diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin deleted file mode 100644 index 62fc8ec5ed26b802d5afd7bf9761c28ec4c623b3..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:48fa62c3576c9c19a44ebe80fad379ae8a645417d62bc3fb439a5a3d63277870 -size 112148480 diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip index 19f8bfe5830b5fc9ce23368be874f980a1bbbddc..6ba3bb6f5890436a442a6707b7c8f276da7ec36f 100644 --- a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:83748ce4e7da396adf31bb927f4757143b48e59eda4d679dda5cc3b6e0f16c07 -size 93992296 +oid sha256:1e7afc3e2b35515e74b26c94a265a232436bdd5ca8b9896efd7b3091af1484bd +size 93992314 diff --git a/precompiled/qualcomm-snapdragon-x-elite/tool-versions.yaml b/precompiled/qualcomm-snapdragon-x-elite/tool-versions.yaml index da45f7a258efe5ac9b94b5f6d444bf650b0dc651..2651df2a5778b3f91e7ee070551106ab67282c06 100644 --- a/precompiled/qualcomm-snapdragon-x-elite/tool-versions.yaml +++ b/precompiled/qualcomm-snapdragon-x-elite/tool-versions.yaml @@ -1,4 +1,4 @@ tool_versions: precompiled_qnn_onnx: qairt: 2.37.1.250807093845_124904 - onnx_runtime: 1.22.2 + onnx_runtime: 1.23.0