diff --git a/DEPLOYMENT_MODEL_LICENSE.pdf b/DEPLOYMENT_MODEL_LICENSE.pdf deleted file mode 100644 index 42699872aa2347c5837d291559bcd5eaa302b7ea..0000000000000000000000000000000000000000 --- a/DEPLOYMENT_MODEL_LICENSE.pdf +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4409f93b0e82531303b3e10f52f1fdfb56467a25f05b7441c6bbd8bb8a64b42c -size 109629 diff --git a/LICENSE b/LICENSE index 698c1c0c019be1401276a8b21e1cabd82223a56a..a2a056017d99b57b1611b9022159cc3d3fcac2a5 100644 --- a/LICENSE +++ b/LICENSE @@ -1,2 +1 @@ The license of the original trained model can be found at https://github.com/huggingface/transformers/blob/v4.42.3/LICENSE. -The license for the deployable model files (.tflite, .onnx, .dlc, .bin, etc.) can be found in DEPLOYMENT_MODEL_LICENSE.pdf. diff --git a/README.md b/README.md index 2542b8003d56256186c8c9a901737501500f64be..fb35e64ab54cef75d93aeebcecd160fd875c11fc 100644 --- a/README.md +++ b/README.md @@ -35,44 +35,48 @@ More details on model performance across various devices, can be found | Model | Precision | Device | Chipset | Target Runtime | Inference Time (ms) | Peak Memory Range (MB) | Primary Compute Unit | Target Model |---|---|---|---|---|---|---|---|---| -| WhisperSmallEncoderQuantizable | w8a16 | Dragonwing RB3 Gen 2 Vision Kit | Qualcomm® QCS6490 | PRECOMPILED_QNN_ONNX | 537.889 ms | 30 - 33 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_CONTEXT_BINARY | 458.786 ms | 1 - 10 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_CONTEXT_BINARY | 353.084 ms | 1 - 3 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | PRECOMPILED_QNN_ONNX | 62.712 ms | 0 - 113 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_CONTEXT_BINARY | 267.301 ms | 1 - 10 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | SA7255P ADP | Qualcomm® SA7255P | QNN_CONTEXT_BINARY | 458.786 ms | 1 - 10 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_CONTEXT_BINARY | 335.324 ms | 1 - 3 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_CONTEXT_BINARY | 330.105 ms | 1 - 2 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | SA8775P ADP | Qualcomm® SA8775P | QNN_CONTEXT_BINARY | 267.301 ms | 1 - 10 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_CONTEXT_BINARY | 250.011 ms | 1 - 19 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | PRECOMPILED_QNN_ONNX | 44.505 ms | 64 - 82 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Samsung Galaxy S25 | Snapdragon® 8 Elite For Galaxy Mobile | QNN_CONTEXT_BINARY | 202.875 ms | 1 - 14 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Samsung Galaxy S25 | Snapdragon® 8 Elite For Galaxy Mobile | PRECOMPILED_QNN_ONNX | 35.201 ms | 63 - 78 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon 7 Gen 4 QRD | Snapdragon® 7 Gen 4 Mobile | QNN_CONTEXT_BINARY | 526.452 ms | 3 - 17 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon 7 Gen 4 QRD | Snapdragon® 7 Gen 4 Mobile | PRECOMPILED_QNN_ONNX | 183.764 ms | 63 - 77 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon 8 Elite Gen 5 QRD | Snapdragon® 8 Elite Gen5 Mobile | QNN_CONTEXT_BINARY | 179.19 ms | 1 - 11 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon 8 Elite Gen 5 QRD | Snapdragon® 8 Elite Gen5 Mobile | PRECOMPILED_QNN_ONNX | 29.961 ms | 62 - 73 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_CONTEXT_BINARY | 243.159 ms | 0 - 0 MB | NPU | Use Export Script | -| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | PRECOMPILED_QNN_ONNX | 61.68 ms | 107 - 107 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Dragonwing RB3 Gen 2 Vision Kit | Qualcomm® QCS6490 | PRECOMPILED_QNN_ONNX | 32.659 ms | 27 - 59 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_CONTEXT_BINARY | 13.485 ms | 29 - 39 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_CONTEXT_BINARY | 8.416 ms | 27 - 29 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | PRECOMPILED_QNN_ONNX | 8.737 ms | 0 - 193 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_CONTEXT_BINARY | 9.562 ms | 27 - 37 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | SA7255P ADP | Qualcomm® SA7255P | QNN_CONTEXT_BINARY | 13.485 ms | 29 - 39 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_CONTEXT_BINARY | 8.495 ms | 27 - 29 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_CONTEXT_BINARY | 8.279 ms | 34 - 37 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | SA8775P ADP | Qualcomm® SA8775P | QNN_CONTEXT_BINARY | 9.562 ms | 27 - 37 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_CONTEXT_BINARY | 6.409 ms | 30 - 49 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | PRECOMPILED_QNN_ONNX | 6.785 ms | 38 - 57 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Samsung Galaxy S25 | Snapdragon® 8 Elite For Galaxy Mobile | QNN_CONTEXT_BINARY | 4.763 ms | 21 - 38 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Samsung Galaxy S25 | Snapdragon® 8 Elite For Galaxy Mobile | PRECOMPILED_QNN_ONNX | 5.095 ms | 26 - 39 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon 7 Gen 4 QRD | Snapdragon® 7 Gen 4 Mobile | QNN_CONTEXT_BINARY | 11.037 ms | 30 - 45 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon 7 Gen 4 QRD | Snapdragon® 7 Gen 4 Mobile | PRECOMPILED_QNN_ONNX | 11.94 ms | 30 - 43 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon 8 Elite Gen 5 QRD | Snapdragon® 8 Elite Gen5 Mobile | QNN_CONTEXT_BINARY | 4.012 ms | 30 - 42 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon 8 Elite Gen 5 QRD | Snapdragon® 8 Elite Gen5 Mobile | PRECOMPILED_QNN_ONNX | 4.368 ms | 37 - 48 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_CONTEXT_BINARY | 7.725 ms | 30 - 30 MB | NPU | Use Export Script | -| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | PRECOMPILED_QNN_ONNX | 7.841 ms | 186 - 186 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | Dragonwing Q-6690 MTP | Qualcomm® Qcm6690 | QNN_CONTEXT_BINARY | 4274.97 ms | 1 - 14 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | Dragonwing Q-6690 MTP | Qualcomm® Qcm6690 | PRECOMPILED_QNN_ONNX | 1576.21 ms | 2 - 16 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | Dragonwing RB3 Gen 2 Vision Kit | Qualcomm® QCS6490 | PRECOMPILED_QNN_ONNX | 538.969 ms | 48 - 51 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_CONTEXT_BINARY | 463.377 ms | 1 - 9 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_CONTEXT_BINARY | 307.27 ms | 1 - 4 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | PRECOMPILED_QNN_ONNX | 61.701 ms | 63 - 65 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_CONTEXT_BINARY | 270.353 ms | 1 - 10 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | SA7255P ADP | Qualcomm® SA7255P | QNN_CONTEXT_BINARY | 463.377 ms | 1 - 9 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_CONTEXT_BINARY | 345.284 ms | 1 - 3 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_CONTEXT_BINARY | 331.302 ms | 1 - 3 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | SA8775P ADP | Qualcomm® SA8775P | QNN_CONTEXT_BINARY | 270.353 ms | 1 - 10 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_CONTEXT_BINARY | 250.146 ms | 1 - 18 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | PRECOMPILED_QNN_ONNX | 45.286 ms | 63 - 82 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | Samsung Galaxy S25 | Snapdragon® 8 Elite For Galaxy Mobile | QNN_CONTEXT_BINARY | 207.463 ms | 1 - 17 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | Samsung Galaxy S25 | Snapdragon® 8 Elite For Galaxy Mobile | PRECOMPILED_QNN_ONNX | 36.987 ms | 63 - 77 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon 7 Gen 4 QRD | Snapdragon® 7 Gen 4 Mobile | QNN_CONTEXT_BINARY | 527.982 ms | 0 - 13 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon 7 Gen 4 QRD | Snapdragon® 7 Gen 4 Mobile | PRECOMPILED_QNN_ONNX | 187.371 ms | 53 - 63 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon 8 Elite Gen 5 QRD | Snapdragon® 8 Elite Gen5 Mobile | QNN_CONTEXT_BINARY | 197.418 ms | 1 - 12 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon 8 Elite Gen 5 QRD | Snapdragon® 8 Elite Gen5 Mobile | PRECOMPILED_QNN_ONNX | 27.177 ms | 62 - 73 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_CONTEXT_BINARY | 245.094 ms | 0 - 0 MB | NPU | Use Export Script | +| WhisperSmallEncoderQuantizable | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | PRECOMPILED_QNN_ONNX | 61.585 ms | 107 - 107 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | Dragonwing Q-6690 MTP | Qualcomm® Qcm6690 | QNN_CONTEXT_BINARY | 40.815 ms | 30 - 44 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | Dragonwing Q-6690 MTP | Qualcomm® Qcm6690 | PRECOMPILED_QNN_ONNX | 31.387 ms | 39 - 52 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | Dragonwing RB3 Gen 2 Vision Kit | Qualcomm® QCS6490 | PRECOMPILED_QNN_ONNX | 31.995 ms | 29 - 62 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_CONTEXT_BINARY | 13.519 ms | 26 - 34 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_CONTEXT_BINARY | 8.418 ms | 30 - 34 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | PRECOMPILED_QNN_ONNX | 8.647 ms | 29 - 31 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_CONTEXT_BINARY | 9.426 ms | 25 - 34 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | SA7255P ADP | Qualcomm® SA7255P | QNN_CONTEXT_BINARY | 13.519 ms | 26 - 34 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_CONTEXT_BINARY | 8.309 ms | 30 - 33 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_CONTEXT_BINARY | 8.365 ms | 30 - 33 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | SA8775P ADP | Qualcomm® SA8775P | QNN_CONTEXT_BINARY | 9.426 ms | 25 - 34 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_CONTEXT_BINARY | 6.396 ms | 14 - 32 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | PRECOMPILED_QNN_ONNX | 6.819 ms | 38 - 57 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | Samsung Galaxy S25 | Snapdragon® 8 Elite For Galaxy Mobile | QNN_CONTEXT_BINARY | 4.744 ms | 28 - 44 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | Samsung Galaxy S25 | Snapdragon® 8 Elite For Galaxy Mobile | PRECOMPILED_QNN_ONNX | 5.144 ms | 26 - 37 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon 7 Gen 4 QRD | Snapdragon® 7 Gen 4 Mobile | QNN_CONTEXT_BINARY | 11.215 ms | 32 - 46 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon 7 Gen 4 QRD | Snapdragon® 7 Gen 4 Mobile | PRECOMPILED_QNN_ONNX | 11.984 ms | 38 - 52 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon 8 Elite Gen 5 QRD | Snapdragon® 8 Elite Gen5 Mobile | QNN_CONTEXT_BINARY | 3.992 ms | 28 - 39 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon 8 Elite Gen 5 QRD | Snapdragon® 8 Elite Gen5 Mobile | PRECOMPILED_QNN_ONNX | 4.418 ms | 36 - 46 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_CONTEXT_BINARY | 7.669 ms | 30 - 30 MB | NPU | Use Export Script | +| WhisperSmallDecoderQuantizable | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | PRECOMPILED_QNN_ONNX | 7.777 ms | 186 - 186 MB | NPU | Use Export Script | @@ -159,7 +163,6 @@ Explore all available models on [Qualcomm® AI Hub](https://aihub.qualcomm.com/) ## License * The license for the original implementation of Whisper-Small-Quantized can be found [here](https://github.com/huggingface/transformers/blob/v4.42.3/LICENSE). -* The license for the compiled assets for on-device deployment can be found [here](https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/Qualcomm+AI+Hub+Proprietary+License.pdf) diff --git a/precompiled/qualcomm-qcm6690/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcm6690/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin new file mode 100644 index 0000000000000000000000000000000000000000..58a209d9f633f2f716963ca62bb39a1447382abd --- /dev/null +++ b/precompiled/qualcomm-qcm6690/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:327e49de3f5eccfc17ad8e57e1da85c1ad54f583d20705495e1dafcb21701cf6 +size 225636352 diff --git a/precompiled/qualcomm-qcm6690/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-qcm6690/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..6262709f8b013f4b5ae4a70b9807f35f89c13383 --- /dev/null +++ b/precompiled/qualcomm-qcm6690/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd0ac107e9e0624de5cf8d834067a8e8c26c185cb8138d391c3541b68964df2c +size 193700590 diff --git a/precompiled/qualcomm-qcm6690/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcm6690/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin new file mode 100644 index 0000000000000000000000000000000000000000..27ce6e6f103a8f4fbed7219bf1175f7ee49182d0 --- /dev/null +++ b/precompiled/qualcomm-qcm6690/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9896983d0899141305703f60b387e09d190f3e531d2269f0acb732fa4c557ea5 +size 187011072 diff --git a/precompiled/qualcomm-qcm6690/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-qcm6690/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..c1752f6c63e0321a6d546fbb6f30fd2b5696d9ec --- /dev/null +++ b/precompiled/qualcomm-qcm6690/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1576c2abba6350944ea4b913125cf2bc7e9ebdb7e25d635344c8ad5c1559873 +size 101219746 diff --git a/precompiled/qualcomm-qcm6690/tool-versions.yaml b/precompiled/qualcomm-qcm6690/tool-versions.yaml new file mode 100644 index 0000000000000000000000000000000000000000..2651df2a5778b3f91e7ee070551106ab67282c06 --- /dev/null +++ b/precompiled/qualcomm-qcm6690/tool-versions.yaml @@ -0,0 +1,4 @@ +tool_versions: + precompiled_qnn_onnx: + qairt: 2.37.1.250807093845_124904 + onnx_runtime: 1.23.0 diff --git a/precompiled/qualcomm-qcs6490/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-qcs6490/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip index dbf30e6b27cf0fdf47e58c41f37c98a74d0f2879..700b065bfcb833fa6d9ac55790f69c5a289a0f14 100644 --- a/precompiled/qualcomm-qcs6490/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-qcs6490/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:57600c23f629dc4856253125f2247a207654d6c0109847f3cfe77d2aa7294774 -size 193518242 +oid sha256:5d5ae1ce2b117ba20a21b1517046729199a8bdd24c233884547901aed115704d +size 193518277 diff --git a/precompiled/qualcomm-qcs6490/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-qcs6490/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip index 89bce04d72434e86a355d967ff715982f2414c41..50c227c9d8214fd1d8bf072e080bf26b813c9c85 100644 --- a/precompiled/qualcomm-qcs6490/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-qcs6490/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:00219edb3cfbfd14364f2c3324a7c9201e27e12e1a70d265b162f23da1ca831c -size 102104981 +oid sha256:9b61f928340aa452b86362c93f3c793e2765d39cb44a9f7eb5e66d50c687d316 +size 102105014 diff --git a/precompiled/qualcomm-qcs8275-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcs8275-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin index f934148e368cef66f76fff84804aef5177467ba2..14bff8110f378ed7a438ba2bc1885cb76338fc17 100644 --- a/precompiled/qualcomm-qcs8275-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-qcs8275-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:24208db19866047ea5ad231d2836f469283e3f637e8b024ff42be251e6c0bdcf -size 225382400 +oid sha256:7f8eb26090b3d6422daa3a666425c30aa5e969ea71ef5b92a5c7ed044d32181c +size 225398784 diff --git a/precompiled/qualcomm-qcs8275-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcs8275-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin index 130190fe3c5c8ac2418a3c32ac2f41e3998f0ec8..49fed2f39876d63a72e12ce6454f5ca1da15651c 100644 --- a/precompiled/qualcomm-qcs8275-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-qcs8275-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4794729267b57f8d32ce5ba27a3419f395db5c1f02c8d4dbdf3b6f7971004e8d -size 130682880 +oid sha256:3716719e2e4cc9c5392b7c97f6dbcaa6d0edae6ca065b86ce7b1ee1481e6c29e +size 133246976 diff --git a/precompiled/qualcomm-qcs8275-proxy/tool-versions.yaml b/precompiled/qualcomm-qcs8275-proxy/tool-versions.yaml index 4cb4c03408f55902c17ea51b9b055908dfbcac32..e47c5de04aa0a4337b0bdc894a0beb3da86b57c6 100644 --- a/precompiled/qualcomm-qcs8275-proxy/tool-versions.yaml +++ b/precompiled/qualcomm-qcs8275-proxy/tool-versions.yaml @@ -1,3 +1,3 @@ tool_versions: qnn_context_binary: - qairt: 2.40.0.251030114326_189385-auto + qairt: 2.41.0.251128145156_191518-auto diff --git a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin index dec9757ee21ac7ff2dbbf3bc8fb4d8ead27b6957..46a1e3f5c796b9fa31c32c028750e236bf71f11c 100644 --- a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:10394e71510154ed77feae4dc48450d289685a1eee515fbd5f5655541c908ef8 -size 225378304 +oid sha256:b14e04ef879365480fc0eaff9e62ad034218a39556aedc5339af70f626ace650 +size 225398784 diff --git a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip index 722c575e70d889397c291a62a4e4c5d3e400adfa..836dd5edfeee0db8181780886cdd751da8bab099 100644 --- a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:47054c0afebadfb456f3a5307731b6e85dd20aa6d2c8b01d80f59296cdd65783 -size 193590918 +oid sha256:2743abf41feb89901646354c21d473ca2899d986b1f09c1c00649041db1d26d7 +size 193590953 diff --git a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin index 1aa536d8f3e7d2f0a167193a2fac45c35c34e3eb..2fb86d3c4fd38973a2d76f51b3c25b663d593b96 100644 --- a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:79df9e8e3a94e3923bf5ae03a60bf4622e28bdf60153246a9336867655b9664c -size 130580480 +oid sha256:09dc49f9dcceb42232eaf1d3b25db49b85863ef3b9c7128483f6be031766e351 +size 133283840 diff --git a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip index 4af299836da35f133cc386289679bd708685b92e..c34f373067766ea8d647f30f3bde2e6ed9a65747 100644 --- a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:127854ee8c90c814a983e5a1cb4faee1a2661d8e4640c99e50b66ca231156225 -size 93996909 +oid sha256:0e1f3c49afa25d840672c732f1b340daf0e094b3556823eb95d26d4aa369ce79 +size 93996941 diff --git a/precompiled/qualcomm-qcs9075-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcs9075-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin index 2d3188a1e4741562c011c63e2b8cab7d1d83e68b..f60e4fb06634d07a8d06391a65211e19015e78fc 100644 --- a/precompiled/qualcomm-qcs9075-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-qcs9075-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1843626282087293ceb96dbfe14e5c80689f33b4658c6887092d35b881b0be00 -size 225386496 +oid sha256:614760733160982e6b1bd776f85f0159b5212a7a12b6996e4286d6c823d09640 +size 225402880 diff --git a/precompiled/qualcomm-qcs9075-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-qcs9075-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin index 141c1a5bbb79584449235818e9b71af982cd726a..177bd0561dd5f15f7f91620700c1021f8f0f49a3 100644 --- a/precompiled/qualcomm-qcs9075-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-qcs9075-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ef0733e4636f075193280ac4d3c1beabf6b5b6b4603369ce89b7cf726fd39028 -size 130678784 +oid sha256:a5cdc84e13d269451e56965335680e1317dc6d2658949de51c5a10aae416aa94 +size 133292032 diff --git a/precompiled/qualcomm-qcs9075-proxy/tool-versions.yaml b/precompiled/qualcomm-qcs9075-proxy/tool-versions.yaml index 4cb4c03408f55902c17ea51b9b055908dfbcac32..e47c5de04aa0a4337b0bdc894a0beb3da86b57c6 100644 --- a/precompiled/qualcomm-qcs9075-proxy/tool-versions.yaml +++ b/precompiled/qualcomm-qcs9075-proxy/tool-versions.yaml @@ -1,3 +1,3 @@ tool_versions: qnn_context_binary: - qairt: 2.40.0.251030114326_189385-auto + qairt: 2.41.0.251128145156_191518-auto diff --git a/precompiled/qualcomm-sa7255p/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa7255p/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin index f934148e368cef66f76fff84804aef5177467ba2..14bff8110f378ed7a438ba2bc1885cb76338fc17 100644 --- a/precompiled/qualcomm-sa7255p/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-sa7255p/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:24208db19866047ea5ad231d2836f469283e3f637e8b024ff42be251e6c0bdcf -size 225382400 +oid sha256:7f8eb26090b3d6422daa3a666425c30aa5e969ea71ef5b92a5c7ed044d32181c +size 225398784 diff --git a/precompiled/qualcomm-sa7255p/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa7255p/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin index 130190fe3c5c8ac2418a3c32ac2f41e3998f0ec8..49fed2f39876d63a72e12ce6454f5ca1da15651c 100644 --- a/precompiled/qualcomm-sa7255p/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-sa7255p/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4794729267b57f8d32ce5ba27a3419f395db5c1f02c8d4dbdf3b6f7971004e8d -size 130682880 +oid sha256:3716719e2e4cc9c5392b7c97f6dbcaa6d0edae6ca065b86ce7b1ee1481e6c29e +size 133246976 diff --git a/precompiled/qualcomm-sa7255p/tool-versions.yaml b/precompiled/qualcomm-sa7255p/tool-versions.yaml index 4cb4c03408f55902c17ea51b9b055908dfbcac32..e47c5de04aa0a4337b0bdc894a0beb3da86b57c6 100644 --- a/precompiled/qualcomm-sa7255p/tool-versions.yaml +++ b/precompiled/qualcomm-sa7255p/tool-versions.yaml @@ -1,3 +1,3 @@ tool_versions: qnn_context_binary: - qairt: 2.40.0.251030114326_189385-auto + qairt: 2.41.0.251128145156_191518-auto diff --git a/precompiled/qualcomm-sa8255p-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa8255p-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin index dec9757ee21ac7ff2dbbf3bc8fb4d8ead27b6957..46a1e3f5c796b9fa31c32c028750e236bf71f11c 100644 --- a/precompiled/qualcomm-sa8255p-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-sa8255p-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:10394e71510154ed77feae4dc48450d289685a1eee515fbd5f5655541c908ef8 -size 225378304 +oid sha256:b14e04ef879365480fc0eaff9e62ad034218a39556aedc5339af70f626ace650 +size 225398784 diff --git a/precompiled/qualcomm-sa8255p-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa8255p-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin index 1aa536d8f3e7d2f0a167193a2fac45c35c34e3eb..2fb86d3c4fd38973a2d76f51b3c25b663d593b96 100644 --- a/precompiled/qualcomm-sa8255p-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-sa8255p-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:79df9e8e3a94e3923bf5ae03a60bf4622e28bdf60153246a9336867655b9664c -size 130580480 +oid sha256:09dc49f9dcceb42232eaf1d3b25db49b85863ef3b9c7128483f6be031766e351 +size 133283840 diff --git a/precompiled/qualcomm-sa8255p-proxy/tool-versions.yaml b/precompiled/qualcomm-sa8255p-proxy/tool-versions.yaml index dd8b2661f081194cd120bbfbfedc0d2de466fa2d..24628b680cbadb36fea7576eefde7ca39cedf3d5 100644 --- a/precompiled/qualcomm-sa8255p-proxy/tool-versions.yaml +++ b/precompiled/qualcomm-sa8255p-proxy/tool-versions.yaml @@ -1,3 +1,3 @@ tool_versions: qnn_context_binary: - qairt: 2.40.0.251030114326_189385 + qairt: 2.41.0.251128145156_191518 diff --git a/precompiled/qualcomm-sa8650p-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa8650p-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin index dec9757ee21ac7ff2dbbf3bc8fb4d8ead27b6957..46a1e3f5c796b9fa31c32c028750e236bf71f11c 100644 --- a/precompiled/qualcomm-sa8650p-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-sa8650p-proxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:10394e71510154ed77feae4dc48450d289685a1eee515fbd5f5655541c908ef8 -size 225378304 +oid sha256:b14e04ef879365480fc0eaff9e62ad034218a39556aedc5339af70f626ace650 +size 225398784 diff --git a/precompiled/qualcomm-sa8650p-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa8650p-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin index 1aa536d8f3e7d2f0a167193a2fac45c35c34e3eb..2fb86d3c4fd38973a2d76f51b3c25b663d593b96 100644 --- a/precompiled/qualcomm-sa8650p-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-sa8650p-proxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:79df9e8e3a94e3923bf5ae03a60bf4622e28bdf60153246a9336867655b9664c -size 130580480 +oid sha256:09dc49f9dcceb42232eaf1d3b25db49b85863ef3b9c7128483f6be031766e351 +size 133283840 diff --git a/precompiled/qualcomm-sa8650p-proxy/tool-versions.yaml b/precompiled/qualcomm-sa8650p-proxy/tool-versions.yaml index dd8b2661f081194cd120bbfbfedc0d2de466fa2d..24628b680cbadb36fea7576eefde7ca39cedf3d5 100644 --- a/precompiled/qualcomm-sa8650p-proxy/tool-versions.yaml +++ b/precompiled/qualcomm-sa8650p-proxy/tool-versions.yaml @@ -1,3 +1,3 @@ tool_versions: qnn_context_binary: - qairt: 2.40.0.251030114326_189385 + qairt: 2.41.0.251128145156_191518 diff --git a/precompiled/qualcomm-sa8775p/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa8775p/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin index 2d3188a1e4741562c011c63e2b8cab7d1d83e68b..f60e4fb06634d07a8d06391a65211e19015e78fc 100644 --- a/precompiled/qualcomm-sa8775p/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-sa8775p/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1843626282087293ceb96dbfe14e5c80689f33b4658c6887092d35b881b0be00 -size 225386496 +oid sha256:614760733160982e6b1bd776f85f0159b5212a7a12b6996e4286d6c823d09640 +size 225402880 diff --git a/precompiled/qualcomm-sa8775p/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-sa8775p/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin index 141c1a5bbb79584449235818e9b71af982cd726a..177bd0561dd5f15f7f91620700c1021f8f0f49a3 100644 --- a/precompiled/qualcomm-sa8775p/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-sa8775p/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ef0733e4636f075193280ac4d3c1beabf6b5b6b4603369ce89b7cf726fd39028 -size 130678784 +oid sha256:a5cdc84e13d269451e56965335680e1317dc6d2658949de51c5a10aae416aa94 +size 133292032 diff --git a/precompiled/qualcomm-sa8775p/tool-versions.yaml b/precompiled/qualcomm-sa8775p/tool-versions.yaml index 4cb4c03408f55902c17ea51b9b055908dfbcac32..e47c5de04aa0a4337b0bdc894a0beb3da86b57c6 100644 --- a/precompiled/qualcomm-sa8775p/tool-versions.yaml +++ b/precompiled/qualcomm-sa8775p/tool-versions.yaml @@ -1,3 +1,3 @@ tool_versions: qnn_context_binary: - qairt: 2.40.0.251030114326_189385-auto + qairt: 2.41.0.251128145156_191518-auto diff --git a/precompiled/qualcomm-snapdragon-7gen4/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-7gen4/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin index 7846ccb1250ebed3df30ac161b7c3c222138aafb..a1b7074a1b6508100593f3d178153849233284d8 100644 --- a/precompiled/qualcomm-snapdragon-7gen4/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-snapdragon-7gen4/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9c4e5b2c9d14cbd89276b447dafe01c47c469125b1c106581c4975095069d1c0 -size 225513472 +oid sha256:74245f6b7c58877881e8d369ae33dc13d012c56602eaefc8fc5b2beb6cdc2819 +size 225529856 diff --git a/precompiled/qualcomm-snapdragon-7gen4/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-7gen4/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip index fa2f886567aa9a1fdeb7b2d6ba231e3a2b151744..cd15e38caaeb10c045b0c9b2bcc4444f32cb3942 100644 --- a/precompiled/qualcomm-snapdragon-7gen4/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-7gen4/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bb1783b340467387cc5d85f83cd80c8dd349cb45a1d96198ac619d89bc0cac02 -size 193634987 +oid sha256:0916b277fb90a3c07dad30bb9beb6c140bcf888acf56edcce7ceafc32c4593a3 +size 193635048 diff --git a/precompiled/qualcomm-snapdragon-7gen4/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-7gen4/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin index fc29666e5df091c68e6f3d6f6bc6a550adb68283..7ab7cd17ea04d67180ed8b415c26e83300e3390c 100644 --- a/precompiled/qualcomm-snapdragon-7gen4/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-snapdragon-7gen4/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d77d64e8b1b4f3d7c9646f9bbc9131d594ab70a9b85fab3a5e9b6779e5e5023c -size 145821696 +oid sha256:fad65c8a6005f43d940643ff038c557ebbdbdb43176534649c7f022095247e05 +size 148570112 diff --git a/precompiled/qualcomm-snapdragon-7gen4/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-7gen4/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip index 412f781ece06e2a24e2f0fa20fac67c8e0c50623..c89cd03c439637b9df1533fcade8a29901514804 100644 --- a/precompiled/qualcomm-snapdragon-7gen4/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-7gen4/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9c22175c3ad26cb22386a78a5a5054b2daeb175d730eb4bea2f0802fd9a43c43 -size 110006846 +oid sha256:12baef1fe946ce8d744540d1b22d707a1a19eb07bb9224bd5d7d78e212932f91 +size 110006863 diff --git a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin index 4433169a25dd25bc4f416f93f359eb4a400a0f6d..cbee14e5893704401c51389e855b491b683873bf 100644 --- a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:25fe4234de1f21dc4f86e5d9e892eaf408f14353c0c1d9d26f46c7c87d2d699c -size 225320960 +oid sha256:1f8d2b98ec0fa9d9da9b66a08d146cb963a6ac166deb050015c3dd3bebbbb9ae +size 225337344 diff --git a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip index 3a4b40d9548d2fc3296747c17b942522641e733d..2af358737e16557b7ee18f87c4cee673135e7621 100644 --- a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4cdb0c0d3d01a30aa44fb67e66c5dea4e1b3f8d2120e585ce007037986ddd18a -size 193571498 +oid sha256:8790539ce7cde56dbe2abdeb0924b98b53d5aef97365f56d4e9f0d3f48c03a81 +size 193571532 diff --git a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin index 85feba23142031dfe0414d8a6016f2c013ad60a6..3b5f673308261d1ce50a6bde59ac2c6c04749903 100644 --- a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ad0e827e028aa01bc8efd4b4286ec3763f094e580903521a1f4276a3a3d1280d -size 129683456 +oid sha256:a2982c900161091b822c93a9df0015747158a75b1c0d71a66b84752205319e69 +size 132247552 diff --git a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip index b829cfd60fbec9ce998b6ec271d022dfc298bd11..55d3f4d1a9d765849db8eb404ebfcbd883f269bd 100644 --- a/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-8-elite-for-galaxy/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f4a744302a5f4b99676d7635a06559c1db1c09fdf8987446d9289c98af6cb6f0 -size 93686223 +oid sha256:347377a0d2ef7eb652daa764da911fe9b9ea7bbbc7e6d600ecbda8fc35117f31 +size 93686254 diff --git a/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin index e154d4fd2c9bd8c1f297d1455da4f95533dc92ea..89cb3b1ccf574c155548ee5f8e48fc0360e06b40 100644 --- a/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0ae8c828515e159b8c6d31acdd6df36a40a2511a48bb7a743e54e9f8fbb399ec -size 225484800 +oid sha256:ba0ab87882d54b304bf0bf571faacf4f4582c1d22d6288254622424c8be9776e +size 225501184 diff --git a/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip index db0df890b2dc21e7c81c3d334fc4e25842cd372d..139201a9f1fe47ce70cb2394820228f15ea8b284 100644 --- a/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:92d4a8126793b548f06288a69a39b254ae66c5cce965e5b4b5b97dbe450cd863 -size 193623918 +oid sha256:83aec4b198ddab15656a6d19fd829da5a8f4751fb736e4030d4c8d269d725e19 +size 193623914 diff --git a/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin index 6d2669335f3817c4a7e705fc5eacc7dce840729f..f44770a903c12c12740c01287ce78dec421175c8 100644 --- a/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:68440264fd98da6dff55960c62385e3e7cf8ecf1bcf151eeab3221dba24d7ff4 -size 132378624 +oid sha256:1a06f93abf396762e762e3d23681d21f5f1bf7234b5c7ee1110d3cc1485a713d +size 134934528 diff --git a/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip index 2db794340b53f37dbccf899d4e9b313847bafde3..df19ce4ce43e0a121fff2beddfa322c2de7c02aa 100644 --- a/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-8-elite-gen5/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7dcbb02351bf80700db43546fe688ea377b24608d7534f9cf14d25db8876c505 -size 94065502 +oid sha256:60312b0a9da5341fb1abe1a59dc77e59ab1b3def63625b798596b8cab14ae40f +size 94065534 diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin index d814c5409c3e767f9da36bb3471c8ebd3427f2da..acf461a8e3a1be35b94a7922ce2f911e21bb7053 100644 --- a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2ce55c7368a2022bbef3070e71d2fb52a112f46581b371344cba209081ad7b10 -size 225374208 +oid sha256:37c2192993bfda4acba4348fa9aa51fdf3055c4cf6992a584bfd82f5300d1225 +size 225390592 diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip index 43616cc507b5705997b0bb980345058256c468af..3a329a3ef58cd02bf6e203776b9047ab88dcda12 100644 --- a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9ac956625f5fe8b00e208941c8d49b02900615b5c82abc2cec08d5aaedbbd736 -size 193588683 +oid sha256:1c7a9f9491d6e613cd429a4610a266f3ab536175903c985b4f0817374318b400 +size 193588834 diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin index 88fa350a714108e4334fe98e7d58567d3ac6dc5c..7bda93ea216e0022d57139eaccea957dfa730f85 100644 --- a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7da541c27e91456e766d6d1caeec55075a9353397d74cd0deaf36ab1db6c2183 -size 130445312 +oid sha256:e6550d3ded85ef93542017fd8db5a69d272c486802442adaa47b85900ab1f348 +size 133124096 diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip index 5334dc91d3cdfe5b272d960da21b69490e96da28..b4cf424efc03a730d758c69e35b74aaa51fe3bde 100644 --- a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e211aa7364781f5978537422f5d254f24ba8257212ea4646688c8c5195bac33d -size 93711025 +oid sha256:e877249f701849ee715838fc1676418aa9de2b32a1b7d9aedaafba1ec981e6b4 +size 93711057 diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin index 878fab4f68cd25264f057f44e06d62f1c9106c7c..aa967c8eb1ded7aa499e733e8cb187c92d28d49a 100644 --- a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2c923fdd7d2606ef14af381b451faf9424ab6084840810b4434168a35533fb5f -size 225378304 +oid sha256:5413fd0496a104e4f470f76fef9028f5a6200482bd33f647549065e7f18b69c2 +size 225398784 diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip index 402745bb44d924a4967658c482ae539f5fd0d011..4d297e98064baae17f04beebe67d8ce5df091573 100644 --- a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallDecoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:aad1deba5891fc49ab797a80a58d16003a6178ccd33c0911331556f59bff53ea -size 193589979 +oid sha256:fad2e0bf28380928ed2f5549ad90a8d3b85bd11484c324ed252ea79904bc4d5c +size 193590013 diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin index 0beade924f85fc8e89844f5f097c5decab44c050..2a5024af2f775d4934f6e7f9fd7e3bca5d00a5ad 100644 --- a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin +++ b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e3c2fd6eaaf562d85a24b60017510a58849597abadc416f7684f0ed7692a6522 -size 130580480 +oid sha256:e38113bb8548b9fb53f302fea907551e37eeccaa78f13ac9707adb5e5ec0c257 +size 133283840 diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip index e0c13c5135ad93e45c2b009e368547afeb4cefab..506e5f82bdfc9a544b4ab39e2c373e438af93d4f 100644 --- a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip +++ b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small-Quantized_WhisperSmallEncoderQuantizable_w8a16.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:347f1e6317e96a992d619b66ff244e1dfda0776991c4937b3f3df9d872b6a556 -size 93992315 +oid sha256:169994e5c8ee168bff1dfed6df6d444edd22a6bca6bf269fe8c03273bdc8c7b3 +size 93992346