diff --git a/README.md b/README.md index 45597987b91fbb7137f696b928155091b975fb6c..73ac30a5fef7a88d416bf021f402e099dd094750 100644 --- a/README.md +++ b/README.md @@ -42,6 +42,7 @@ More details on model performance across various devices, can be found | HfWhisperEncoder | float | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_CONTEXT_BINARY | 130.662 ms | 1 - 10 MB | NPU | Use Export Script | | HfWhisperEncoder | float | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | QNN_CONTEXT_BINARY | 111.747 ms | 1 - 17 MB | NPU | Use Export Script | | HfWhisperEncoder | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_CONTEXT_BINARY | 43.301 ms | 1 - 3 MB | NPU | Use Export Script | +| HfWhisperEncoder | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | PRECOMPILED_QNN_ONNX | 43.665 ms | 0 - 66 MB | NPU | Use Export Script | | HfWhisperEncoder | float | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_CONTEXT_BINARY | 50.193 ms | 1 - 11 MB | NPU | Use Export Script | | HfWhisperEncoder | float | SA7255P ADP | Qualcomm® SA7255P | QNN_CONTEXT_BINARY | 130.662 ms | 1 - 10 MB | NPU | Use Export Script | | HfWhisperEncoder | float | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_CONTEXT_BINARY | 43.516 ms | 1 - 2 MB | NPU | Use Export Script | @@ -49,16 +50,17 @@ More details on model performance across various devices, can be found | HfWhisperEncoder | float | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_CONTEXT_BINARY | 43.199 ms | 1 - 3 MB | NPU | Use Export Script | | HfWhisperEncoder | float | SA8775P ADP | Qualcomm® SA8775P | QNN_CONTEXT_BINARY | 50.193 ms | 1 - 11 MB | NPU | Use Export Script | | HfWhisperEncoder | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | QNN_CONTEXT_BINARY | 43.355 ms | 1 - 4 MB | NPU | Use Export Script | -| HfWhisperEncoder | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | PRECOMPILED_QNN_ONNX | 44.114 ms | 0 - 67 MB | NPU | Use Export Script | +| HfWhisperEncoder | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | PRECOMPILED_QNN_ONNX | 44.178 ms | 0 - 66 MB | NPU | Use Export Script | | HfWhisperEncoder | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_CONTEXT_BINARY | 34.042 ms | 1 - 18 MB | NPU | Use Export Script | -| HfWhisperEncoder | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | PRECOMPILED_QNN_ONNX | 34.282 ms | 34 - 53 MB | NPU | Use Export Script | +| HfWhisperEncoder | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | PRECOMPILED_QNN_ONNX | 33.554 ms | 33 - 51 MB | NPU | Use Export Script | | HfWhisperEncoder | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | QNN_CONTEXT_BINARY | 28.367 ms | 0 - 14 MB | NPU | Use Export Script | -| HfWhisperEncoder | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | PRECOMPILED_QNN_ONNX | 29.337 ms | 39 - 52 MB | NPU | Use Export Script | +| HfWhisperEncoder | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | PRECOMPILED_QNN_ONNX | 28.453 ms | 38 - 52 MB | NPU | Use Export Script | | HfWhisperEncoder | float | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_CONTEXT_BINARY | 42.085 ms | 0 - 0 MB | NPU | Use Export Script | -| HfWhisperEncoder | float | Snapdragon X Elite CRD | Snapdragon® X Elite | PRECOMPILED_QNN_ONNX | 42.398 ms | 66 - 66 MB | NPU | Use Export Script | +| HfWhisperEncoder | float | Snapdragon X Elite CRD | Snapdragon® X Elite | PRECOMPILED_QNN_ONNX | 42.491 ms | 67 - 67 MB | NPU | Use Export Script | | HfWhisperDecoder | float | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_CONTEXT_BINARY | 6.224 ms | 20 - 29 MB | NPU | Use Export Script | | HfWhisperDecoder | float | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | QNN_CONTEXT_BINARY | 5.156 ms | 20 - 42 MB | NPU | Use Export Script | | HfWhisperDecoder | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_CONTEXT_BINARY | 4.053 ms | 20 - 22 MB | NPU | Use Export Script | +| HfWhisperDecoder | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | PRECOMPILED_QNN_ONNX | 4.474 ms | 0 - 142 MB | NPU | Use Export Script | | HfWhisperDecoder | float | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_CONTEXT_BINARY | 4.663 ms | 20 - 30 MB | NPU | Use Export Script | | HfWhisperDecoder | float | SA7255P ADP | Qualcomm® SA7255P | QNN_CONTEXT_BINARY | 6.224 ms | 20 - 29 MB | NPU | Use Export Script | | HfWhisperDecoder | float | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_CONTEXT_BINARY | 3.858 ms | 20 - 22 MB | NPU | Use Export Script | @@ -66,13 +68,13 @@ More details on model performance across various devices, can be found | HfWhisperDecoder | float | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_CONTEXT_BINARY | 3.982 ms | 19 - 21 MB | NPU | Use Export Script | | HfWhisperDecoder | float | SA8775P ADP | Qualcomm® SA8775P | QNN_CONTEXT_BINARY | 4.663 ms | 20 - 30 MB | NPU | Use Export Script | | HfWhisperDecoder | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | QNN_CONTEXT_BINARY | 3.951 ms | 19 - 21 MB | NPU | Use Export Script | -| HfWhisperDecoder | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | PRECOMPILED_QNN_ONNX | 4.654 ms | 0 - 143 MB | NPU | Use Export Script | +| HfWhisperDecoder | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | PRECOMPILED_QNN_ONNX | 4.203 ms | 20 - 22 MB | NPU | Use Export Script | | HfWhisperDecoder | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_CONTEXT_BINARY | 3.142 ms | 0 - 19 MB | NPU | Use Export Script | -| HfWhisperDecoder | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | PRECOMPILED_QNN_ONNX | 3.662 ms | 26 - 46 MB | NPU | Use Export Script | +| HfWhisperDecoder | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | PRECOMPILED_QNN_ONNX | 3.575 ms | 26 - 46 MB | NPU | Use Export Script | | HfWhisperDecoder | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | QNN_CONTEXT_BINARY | 2.638 ms | 18 - 32 MB | NPU | Use Export Script | -| HfWhisperDecoder | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | PRECOMPILED_QNN_ONNX | 3.068 ms | 17 - 31 MB | NPU | Use Export Script | +| HfWhisperDecoder | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | PRECOMPILED_QNN_ONNX | 3.032 ms | 18 - 32 MB | NPU | Use Export Script | | HfWhisperDecoder | float | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_CONTEXT_BINARY | 3.458 ms | 20 - 20 MB | NPU | Use Export Script | -| HfWhisperDecoder | float | Snapdragon X Elite CRD | Snapdragon® X Elite | PRECOMPILED_QNN_ONNX | 3.681 ms | 125 - 125 MB | NPU | Use Export Script | +| HfWhisperDecoder | float | Snapdragon X Elite CRD | Snapdragon® X Elite | PRECOMPILED_QNN_ONNX | 3.476 ms | 125 - 125 MB | NPU | Use Export Script | diff --git a/precompiled/qualcomm-qcs8275-proxy/Whisper-Base_HfWhisperDecoder.bin b/precompiled/qualcomm-qcs8275-proxy/Whisper-Base_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-qcs8275-proxy/Whisper-Base_HfWhisperDecoder.bin rename to precompiled/qualcomm-qcs8275-proxy/Whisper-Base_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-qcs8275-proxy/Whisper-Base_HfWhisperEncoder.bin b/precompiled/qualcomm-qcs8275-proxy/Whisper-Base_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-qcs8275-proxy/Whisper-Base_HfWhisperEncoder.bin rename to precompiled/qualcomm-qcs8275-proxy/Whisper-Base_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-qcs8275-proxy/sdk_versions.yml b/precompiled/qualcomm-qcs8275-proxy/tool-versions.yaml similarity index 81% rename from precompiled/qualcomm-qcs8275-proxy/sdk_versions.yml rename to precompiled/qualcomm-qcs8275-proxy/tool-versions.yaml index cf3db9eb5c8793178dd19d986de2ebb9f7dee490..f83be1ae234292df6b302b536309cbf56a9598b0 100644 --- a/precompiled/qualcomm-qcs8275-proxy/sdk_versions.yml +++ b/precompiled/qualcomm-qcs8275-proxy/tool-versions.yaml @@ -1,3 +1,3 @@ -sdk_versions: +tool_versions: qnn_context_binary: qairt: 2.37.0.250724175447_124859-auto diff --git a/precompiled/qualcomm-qcs8450-proxy/Whisper-Base_HfWhisperDecoder.bin b/precompiled/qualcomm-qcs8450-proxy/Whisper-Base_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-qcs8450-proxy/Whisper-Base_HfWhisperDecoder.bin rename to precompiled/qualcomm-qcs8450-proxy/Whisper-Base_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-qcs8450-proxy/Whisper-Base_HfWhisperEncoder.bin b/precompiled/qualcomm-qcs8450-proxy/Whisper-Base_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-qcs8450-proxy/Whisper-Base_HfWhisperEncoder.bin rename to precompiled/qualcomm-qcs8450-proxy/Whisper-Base_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-sa8255p-proxy/sdk_versions.yml b/precompiled/qualcomm-qcs8450-proxy/tool-versions.yaml similarity index 80% rename from precompiled/qualcomm-sa8255p-proxy/sdk_versions.yml rename to precompiled/qualcomm-qcs8450-proxy/tool-versions.yaml index 645a4ba899019438314a76813152c259f4f74b92..bb24388e3ba98d34090587000fa8f77ca5b64cf0 100644 --- a/precompiled/qualcomm-sa8255p-proxy/sdk_versions.yml +++ b/precompiled/qualcomm-qcs8450-proxy/tool-versions.yaml @@ -1,3 +1,3 @@ -sdk_versions: +tool_versions: qnn_context_binary: qairt: 2.37.0.250724175447_124859 diff --git a/precompiled/qualcomm-qcs8550-proxy/Whisper-Base_HfWhisperDecoder.bin b/precompiled/qualcomm-qcs8550-proxy/Whisper-Base_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-qcs8550-proxy/Whisper-Base_HfWhisperDecoder.bin rename to precompiled/qualcomm-qcs8550-proxy/Whisper-Base_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-qcs8550-proxy/Whisper-Base_HfWhisperDecoder_float.onnx.zip b/precompiled/qualcomm-qcs8550-proxy/Whisper-Base_HfWhisperDecoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..65374c7af30e0dd579c2f56f0bc6abda6d226e4d --- /dev/null +++ b/precompiled/qualcomm-qcs8550-proxy/Whisper-Base_HfWhisperDecoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:816a7e8c22b3e27e166f9118a5c56074334f517fb51087e748d49355a5d461e5 +size 137233744 diff --git a/precompiled/qualcomm-qcs8550-proxy/Whisper-Base_HfWhisperEncoder.bin b/precompiled/qualcomm-qcs8550-proxy/Whisper-Base_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-qcs8550-proxy/Whisper-Base_HfWhisperEncoder.bin rename to precompiled/qualcomm-qcs8550-proxy/Whisper-Base_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-qcs8550-proxy/Whisper-Base_HfWhisperEncoder_float.onnx.zip b/precompiled/qualcomm-qcs8550-proxy/Whisper-Base_HfWhisperEncoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..e6cc5b6d5db91ada1fdeb845a67344711091dd5e --- /dev/null +++ b/precompiled/qualcomm-qcs8550-proxy/Whisper-Base_HfWhisperEncoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abf00457e1481a6698be756ada627efda30a121dd42cb6e90c038c297f7a081d +size 47059814 diff --git a/precompiled/qualcomm-qcs8550-proxy/tool-versions.yaml b/precompiled/qualcomm-qcs8550-proxy/tool-versions.yaml new file mode 100644 index 0000000000000000000000000000000000000000..f0a567e21880e5efda78dc062ffeb343dbb1976b --- /dev/null +++ b/precompiled/qualcomm-qcs8550-proxy/tool-versions.yaml @@ -0,0 +1,4 @@ +tool_versions: + precompiled_qnn_onnx: + qairt: 2.36.4.250725200057_123280 + onnx_runtime: 1.22.0 diff --git a/precompiled/qualcomm-qcs9075-proxy/Whisper-Base_HfWhisperDecoder.bin b/precompiled/qualcomm-qcs9075-proxy/Whisper-Base_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-qcs9075-proxy/Whisper-Base_HfWhisperDecoder.bin rename to precompiled/qualcomm-qcs9075-proxy/Whisper-Base_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-qcs9075-proxy/Whisper-Base_HfWhisperEncoder.bin b/precompiled/qualcomm-qcs9075-proxy/Whisper-Base_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-qcs9075-proxy/Whisper-Base_HfWhisperEncoder.bin rename to precompiled/qualcomm-qcs9075-proxy/Whisper-Base_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-sa7255p/sdk_versions.yml b/precompiled/qualcomm-qcs9075-proxy/tool-versions.yaml similarity index 81% rename from precompiled/qualcomm-sa7255p/sdk_versions.yml rename to precompiled/qualcomm-qcs9075-proxy/tool-versions.yaml index cf3db9eb5c8793178dd19d986de2ebb9f7dee490..f83be1ae234292df6b302b536309cbf56a9598b0 100644 --- a/precompiled/qualcomm-sa7255p/sdk_versions.yml +++ b/precompiled/qualcomm-qcs9075-proxy/tool-versions.yaml @@ -1,3 +1,3 @@ -sdk_versions: +tool_versions: qnn_context_binary: qairt: 2.37.0.250724175447_124859-auto diff --git a/precompiled/qualcomm-sa7255p/Whisper-Base_HfWhisperDecoder.bin b/precompiled/qualcomm-sa7255p/Whisper-Base_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa7255p/Whisper-Base_HfWhisperDecoder.bin rename to precompiled/qualcomm-sa7255p/Whisper-Base_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-sa7255p/Whisper-Base_HfWhisperEncoder.bin b/precompiled/qualcomm-sa7255p/Whisper-Base_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa7255p/Whisper-Base_HfWhisperEncoder.bin rename to precompiled/qualcomm-sa7255p/Whisper-Base_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-sa8295p/sdk_versions.yml b/precompiled/qualcomm-sa7255p/tool-versions.yaml similarity index 81% rename from precompiled/qualcomm-sa8295p/sdk_versions.yml rename to precompiled/qualcomm-sa7255p/tool-versions.yaml index cf3db9eb5c8793178dd19d986de2ebb9f7dee490..f83be1ae234292df6b302b536309cbf56a9598b0 100644 --- a/precompiled/qualcomm-sa8295p/sdk_versions.yml +++ b/precompiled/qualcomm-sa7255p/tool-versions.yaml @@ -1,3 +1,3 @@ -sdk_versions: +tool_versions: qnn_context_binary: qairt: 2.37.0.250724175447_124859-auto diff --git a/precompiled/qualcomm-sa8255p-proxy/Whisper-Base_HfWhisperDecoder.bin b/precompiled/qualcomm-sa8255p-proxy/Whisper-Base_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa8255p-proxy/Whisper-Base_HfWhisperDecoder.bin rename to precompiled/qualcomm-sa8255p-proxy/Whisper-Base_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-sa8255p-proxy/Whisper-Base_HfWhisperEncoder.bin b/precompiled/qualcomm-sa8255p-proxy/Whisper-Base_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa8255p-proxy/Whisper-Base_HfWhisperEncoder.bin rename to precompiled/qualcomm-sa8255p-proxy/Whisper-Base_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-qcs8450-proxy/sdk_versions.yml b/precompiled/qualcomm-sa8255p-proxy/tool-versions.yaml similarity index 80% rename from precompiled/qualcomm-qcs8450-proxy/sdk_versions.yml rename to precompiled/qualcomm-sa8255p-proxy/tool-versions.yaml index 645a4ba899019438314a76813152c259f4f74b92..bb24388e3ba98d34090587000fa8f77ca5b64cf0 100644 --- a/precompiled/qualcomm-qcs8450-proxy/sdk_versions.yml +++ b/precompiled/qualcomm-sa8255p-proxy/tool-versions.yaml @@ -1,3 +1,3 @@ -sdk_versions: +tool_versions: qnn_context_binary: qairt: 2.37.0.250724175447_124859 diff --git a/precompiled/qualcomm-sa8295p/Whisper-Base_HfWhisperDecoder.bin b/precompiled/qualcomm-sa8295p/Whisper-Base_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa8295p/Whisper-Base_HfWhisperDecoder.bin rename to precompiled/qualcomm-sa8295p/Whisper-Base_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-sa8295p/Whisper-Base_HfWhisperEncoder.bin b/precompiled/qualcomm-sa8295p/Whisper-Base_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa8295p/Whisper-Base_HfWhisperEncoder.bin rename to precompiled/qualcomm-sa8295p/Whisper-Base_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-qcs9075-proxy/sdk_versions.yml b/precompiled/qualcomm-sa8295p/tool-versions.yaml similarity index 81% rename from precompiled/qualcomm-qcs9075-proxy/sdk_versions.yml rename to precompiled/qualcomm-sa8295p/tool-versions.yaml index cf3db9eb5c8793178dd19d986de2ebb9f7dee490..f83be1ae234292df6b302b536309cbf56a9598b0 100644 --- a/precompiled/qualcomm-qcs9075-proxy/sdk_versions.yml +++ b/precompiled/qualcomm-sa8295p/tool-versions.yaml @@ -1,3 +1,3 @@ -sdk_versions: +tool_versions: qnn_context_binary: qairt: 2.37.0.250724175447_124859-auto diff --git a/precompiled/qualcomm-sa8650p-proxy/Whisper-Base_HfWhisperDecoder.bin b/precompiled/qualcomm-sa8650p-proxy/Whisper-Base_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa8650p-proxy/Whisper-Base_HfWhisperDecoder.bin rename to precompiled/qualcomm-sa8650p-proxy/Whisper-Base_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-sa8650p-proxy/Whisper-Base_HfWhisperEncoder.bin b/precompiled/qualcomm-sa8650p-proxy/Whisper-Base_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa8650p-proxy/Whisper-Base_HfWhisperEncoder.bin rename to precompiled/qualcomm-sa8650p-proxy/Whisper-Base_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-sa8650p-proxy/sdk_versions.yml b/precompiled/qualcomm-sa8650p-proxy/sdk_versions.yml deleted file mode 100644 index 645a4ba899019438314a76813152c259f4f74b92..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa8650p-proxy/sdk_versions.yml +++ /dev/null @@ -1,3 +0,0 @@ -sdk_versions: - qnn_context_binary: - qairt: 2.37.0.250724175447_124859 diff --git a/precompiled/qualcomm-qcs8550-proxy/sdk_versions.yml b/precompiled/qualcomm-sa8650p-proxy/tool-versions.yaml similarity index 80% rename from precompiled/qualcomm-qcs8550-proxy/sdk_versions.yml rename to precompiled/qualcomm-sa8650p-proxy/tool-versions.yaml index 645a4ba899019438314a76813152c259f4f74b92..bb24388e3ba98d34090587000fa8f77ca5b64cf0 100644 --- a/precompiled/qualcomm-qcs8550-proxy/sdk_versions.yml +++ b/precompiled/qualcomm-sa8650p-proxy/tool-versions.yaml @@ -1,3 +1,3 @@ -sdk_versions: +tool_versions: qnn_context_binary: qairt: 2.37.0.250724175447_124859 diff --git a/precompiled/qualcomm-sa8775p/Whisper-Base_HfWhisperDecoder.bin b/precompiled/qualcomm-sa8775p/Whisper-Base_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa8775p/Whisper-Base_HfWhisperDecoder.bin rename to precompiled/qualcomm-sa8775p/Whisper-Base_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-sa8775p/Whisper-Base_HfWhisperEncoder.bin b/precompiled/qualcomm-sa8775p/Whisper-Base_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa8775p/Whisper-Base_HfWhisperEncoder.bin rename to precompiled/qualcomm-sa8775p/Whisper-Base_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-sa8775p/sdk_versions.yml b/precompiled/qualcomm-sa8775p/sdk_versions.yml deleted file mode 100644 index cf3db9eb5c8793178dd19d986de2ebb9f7dee490..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa8775p/sdk_versions.yml +++ /dev/null @@ -1,3 +0,0 @@ -sdk_versions: - qnn_context_binary: - qairt: 2.37.0.250724175447_124859-auto diff --git a/precompiled/qualcomm-sa8775p/tool-versions.yaml b/precompiled/qualcomm-sa8775p/tool-versions.yaml new file mode 100644 index 0000000000000000000000000000000000000000..f83be1ae234292df6b302b536309cbf56a9598b0 --- /dev/null +++ b/precompiled/qualcomm-sa8775p/tool-versions.yaml @@ -0,0 +1,3 @@ +tool_versions: + qnn_context_binary: + qairt: 2.37.0.250724175447_124859-auto diff --git a/precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperDecoder.onnx.zip b/precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperDecoder.onnx.zip deleted file mode 100644 index 52fa5776b8cf7344ef506652c806762d868f52d9..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperDecoder.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:db3711e486e2619a098b3360509e5480102f4a40dc9314f505a91cfeb9bb4487 -size 137249025 diff --git a/precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperDecoder.bin b/precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperDecoder.bin rename to precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperDecoder_float.onnx.zip b/precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperDecoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..34661f35f91037a6c22e90e30febb855cb0d2d01 --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperDecoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:641f8d531fd02939db617dccfcb64843c421e7eb0a23c5995feb6f29e219ffec +size 137225805 diff --git a/precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperEncoder.onnx.zip b/precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperEncoder.onnx.zip deleted file mode 100644 index 80aab96d98227eb1b63109ca0856c3f7fb68de61..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperEncoder.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:568fb19b243097c66bb87c157d5a3fff7349b6da47a1ec03d2ba892023bda7c5 -size 46961022 diff --git a/precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperEncoder.bin b/precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperEncoder.bin rename to precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperEncoder_float.onnx.zip b/precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperEncoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..c56c40ef950f915c3b3f1eefa9a8de9d681f93a7 --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8-elite/Whisper-Base_HfWhisperEncoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b254c99506c79689f589ea238e62e0c866c05a09c3625a0eea3efc542f129c8d +size 46960730 diff --git a/precompiled/qualcomm-snapdragon-8-elite/sdk_versions.yml b/precompiled/qualcomm-snapdragon-8-elite/sdk_versions.yml deleted file mode 100644 index 609bfba19166f29f971a2e5925e62115df03422c..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8-elite/sdk_versions.yml +++ /dev/null @@ -1,6 +0,0 @@ -sdk_versions: - qnn_context_binary: - qairt: 2.37.0.250724175447_124859 - precompiled_qnn_onnx: - qairt: 2.33.2.250410134701_117956 - onnx_runtime: 1.22.0 diff --git a/precompiled/qualcomm-snapdragon-8-elite/tool-versions.yaml b/precompiled/qualcomm-snapdragon-8-elite/tool-versions.yaml new file mode 100644 index 0000000000000000000000000000000000000000..f0a567e21880e5efda78dc062ffeb343dbb1976b --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8-elite/tool-versions.yaml @@ -0,0 +1,4 @@ +tool_versions: + precompiled_qnn_onnx: + qairt: 2.36.4.250725200057_123280 + onnx_runtime: 1.22.0 diff --git a/precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperDecoder.onnx.zip b/precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperDecoder.onnx.zip deleted file mode 100644 index 297f1357e40ccc40c929fc20d031291f5e01402f..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperDecoder.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:802a4a9cf2671ba673ae50330950db551c2a4c83ef49c335566c451bd049cc76 -size 137259933 diff --git a/precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperDecoder.bin b/precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperDecoder.bin rename to precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperDecoder_float.onnx.zip b/precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperDecoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..d420871c0058201150ec17874f6fed5f75434d10 --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperDecoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01dba04537c77fcd22dd1c2055cb752dde1ab46a67793906702135213d5c9b63 +size 137233734 diff --git a/precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperEncoder.onnx.zip b/precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperEncoder.onnx.zip deleted file mode 100644 index afcfcd45718f5485c2d8b6ca43c3fad57e5ff56b..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperEncoder.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fd91f41d7197d5aaec977ddca0269caf8fb83dc7406136bb78ea2721759cba1f -size 47059025 diff --git a/precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperEncoder.bin b/precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperEncoder.bin rename to precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperEncoder_float.onnx.zip b/precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperEncoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..ae5ffaa3dcc0c9c00493d41dcb5334009853a487 --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8gen2/Whisper-Base_HfWhisperEncoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3584b8ea570eb6f3422e97357f04e89aa4f02e0b382a6658f5021c5f267f0b9 +size 47059814 diff --git a/precompiled/qualcomm-snapdragon-8gen2/sdk_versions.yml b/precompiled/qualcomm-snapdragon-8gen2/sdk_versions.yml deleted file mode 100644 index 609bfba19166f29f971a2e5925e62115df03422c..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8gen2/sdk_versions.yml +++ /dev/null @@ -1,6 +0,0 @@ -sdk_versions: - qnn_context_binary: - qairt: 2.37.0.250724175447_124859 - precompiled_qnn_onnx: - qairt: 2.33.2.250410134701_117956 - onnx_runtime: 1.22.0 diff --git a/precompiled/qualcomm-snapdragon-8gen2/tool-versions.yaml b/precompiled/qualcomm-snapdragon-8gen2/tool-versions.yaml new file mode 100644 index 0000000000000000000000000000000000000000..f0a567e21880e5efda78dc062ffeb343dbb1976b --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8gen2/tool-versions.yaml @@ -0,0 +1,4 @@ +tool_versions: + precompiled_qnn_onnx: + qairt: 2.36.4.250725200057_123280 + onnx_runtime: 1.22.0 diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperDecoder.onnx.zip b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperDecoder.onnx.zip deleted file mode 100644 index d92c7aec8d5388f2072c5a403889883557fdd22b..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperDecoder.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8aeec271119dc14cf73c352f81e5af6a14d8f925e3152a5deeedf1c07bff8061 -size 137260170 diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperDecoder.bin b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperDecoder.bin rename to precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperDecoder_float.onnx.zip b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperDecoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..5fe55948c039c07d5c55b1c8e704b3e60d8d751e --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperDecoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4936f8441d076005adbeeb2f29b472a37beb1ba44789e3033f2eeac69ec817c4 +size 137235108 diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperEncoder.onnx.zip b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperEncoder.onnx.zip deleted file mode 100644 index d3c7ae1ed555960389d4398d2f02b9e2b7cc885d..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperEncoder.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:97aad034a5125124bccd150da53622656e2477c6e722f3077c0ed237437e6389 -size 47012766 diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperEncoder.bin b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperEncoder.bin rename to precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperEncoder_float.onnx.zip b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperEncoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..f748ad818c8fe7c1cab7d584da78df886fc7fbd7 --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Base_HfWhisperEncoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:462615fcefa69f031cb4544ff991d8e052f19a032f57acc76c11216540714470 +size 47005541 diff --git a/precompiled/qualcomm-snapdragon-8gen3/sdk_versions.yml b/precompiled/qualcomm-snapdragon-8gen3/sdk_versions.yml deleted file mode 100644 index 609bfba19166f29f971a2e5925e62115df03422c..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8gen3/sdk_versions.yml +++ /dev/null @@ -1,6 +0,0 @@ -sdk_versions: - qnn_context_binary: - qairt: 2.37.0.250724175447_124859 - precompiled_qnn_onnx: - qairt: 2.33.2.250410134701_117956 - onnx_runtime: 1.22.0 diff --git a/precompiled/qualcomm-snapdragon-8gen3/tool-versions.yaml b/precompiled/qualcomm-snapdragon-8gen3/tool-versions.yaml new file mode 100644 index 0000000000000000000000000000000000000000..f0a567e21880e5efda78dc062ffeb343dbb1976b --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8gen3/tool-versions.yaml @@ -0,0 +1,4 @@ +tool_versions: + precompiled_qnn_onnx: + qairt: 2.36.4.250725200057_123280 + onnx_runtime: 1.22.0 diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperDecoder.onnx.zip b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperDecoder.onnx.zip deleted file mode 100644 index 622211594b14dc7bb190e1ff5adba4db36686621..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperDecoder.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:212d91ba86887971cd98fc13a82e66b3829cbae1c92d6c4b0ff4467d688b1ab9 -size 137259315 diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperDecoder.bin b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperDecoder.bin rename to precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperDecoder_float.onnx.zip b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperDecoder_float.onnx.zip index 622211594b14dc7bb190e1ff5adba4db36686621..9a3fae9e95dfb13fd89e9726119c0b95105faa7d 100644 --- a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperDecoder_float.onnx.zip +++ b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperDecoder_float.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:212d91ba86887971cd98fc13a82e66b3829cbae1c92d6c4b0ff4467d688b1ab9 -size 137259315 +oid sha256:5fb368e96ff013ea354a05207d79646209c16fc26bdb210ce7cf32d472d578af +size 272 diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperEncoder.onnx.zip b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperEncoder.onnx.zip deleted file mode 100644 index a1aa19bb2fc8c6aec6e8920df81bed2dc8081fca..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperEncoder.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6c3adc6079c35b10558934f238d44c73275d102bf1eb74e544206739ad2e267d -size 47065616 diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperEncoder.bin b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperEncoder.bin rename to precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperEncoder_float.onnx.zip b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperEncoder_float.onnx.zip index a1aa19bb2fc8c6aec6e8920df81bed2dc8081fca..746b77e477cb7b3bcc4c9db8936fc4a723fbc7c0 100644 --- a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperEncoder_float.onnx.zip +++ b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Base_HfWhisperEncoder_float.onnx.zip @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6c3adc6079c35b10558934f238d44c73275d102bf1eb74e544206739ad2e267d -size 47065616 +oid sha256:76fa1befb43aae375ab332f5c504f6f34f48a9eecdcb511fbc7b829340b81573 +size 270 diff --git a/precompiled/qualcomm-snapdragon-x-elite/sdk_versions.yml b/precompiled/qualcomm-snapdragon-x-elite/sdk_versions.yml deleted file mode 100644 index 609bfba19166f29f971a2e5925e62115df03422c..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-x-elite/sdk_versions.yml +++ /dev/null @@ -1,6 +0,0 @@ -sdk_versions: - qnn_context_binary: - qairt: 2.37.0.250724175447_124859 - precompiled_qnn_onnx: - qairt: 2.33.2.250410134701_117956 - onnx_runtime: 1.22.0 diff --git a/precompiled/qualcomm-snapdragon-x-elite/tool-versions.yaml b/precompiled/qualcomm-snapdragon-x-elite/tool-versions.yaml new file mode 100644 index 0000000000000000000000000000000000000000..f0a567e21880e5efda78dc062ffeb343dbb1976b --- /dev/null +++ b/precompiled/qualcomm-snapdragon-x-elite/tool-versions.yaml @@ -0,0 +1,4 @@ +tool_versions: + precompiled_qnn_onnx: + qairt: 2.36.4.250725200057_123280 + onnx_runtime: 1.22.0