v0.53.0
Browse files — See https://github.com/qualcomm/ai-hub-models/releases/v0.53.0 for changelog.
- README.md +128 -99
- release_assets.json +19 -19
README.md
CHANGED
|
@@ -29,14 +29,14 @@ Below are pre-exported model assets ready for deployment.
|
|
| 29 |
|
| 30 |
| Runtime | Precision | Chipset | SDK Versions | Download |
|
| 31 |
|---|---|---|---|---|
|
| 32 |
-
| ONNX | float | Universal | QAIRT 2.42, ONNX Runtime 1.24.3 | [Download](https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.
|
| 33 |
-
| ONNX | w8a16 | Universal | QAIRT 2.42, ONNX Runtime 1.24.3 | [Download](https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.
|
| 34 |
-
| ONNX | w8a8 | Universal | QAIRT 2.42, ONNX Runtime 1.24.3 | [Download](https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.
|
| 35 |
-
| QNN_DLC | float | Universal | QAIRT 2.45 | [Download](https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.
|
| 36 |
-
| QNN_DLC | w8a16 | Universal | QAIRT 2.45 | [Download](https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.
|
| 37 |
-
| QNN_DLC | w8a8 | Universal | QAIRT 2.45 | [Download](https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.
|
| 38 |
-
| TFLITE | float | Universal | QAIRT 2.45 | [Download](https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.
|
| 39 |
-
| TFLITE | w8a8 | Universal | QAIRT 2.45 | [Download](https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.
|
| 40 |
|
| 41 |
For more device-specific assets and performance metrics, visit **[GPUNet on Qualcomm® AI Hub](https://aihub.qualcomm.com/models/gpunet)**.
|
| 42 |
|
|
@@ -66,98 +66,127 @@ See our repository for [GPUNet on GitHub](https://github.com/qualcomm/ai-hub-mod
|
|
| 66 |
## Performance Summary
|
| 67 |
| Model | Runtime | Precision | Chipset | Inference Time (ms) | Peak Memory Range (MB) | Primary Compute Unit
|
| 68 |
|---|---|---|---|---|---|---
|
| 69 |
-
| GPUNet | ONNX | float | Snapdragon® 8 Elite Gen 5 Mobile | 0.
|
| 70 |
-
| GPUNet | ONNX | float | Snapdragon®
|
| 71 |
-
| GPUNet | ONNX | float | Snapdragon®
|
| 72 |
-
| GPUNet | ONNX | float | Snapdragon®
|
| 73 |
-
| GPUNet | ONNX | float |
|
| 74 |
-
| GPUNet | ONNX | float |
|
| 75 |
-
| GPUNet | ONNX | float |
|
| 76 |
-
| GPUNet | ONNX |
|
| 77 |
-
| GPUNet | ONNX |
|
| 78 |
-
| GPUNet | ONNX | w8a16 | Snapdragon®
|
| 79 |
-
| GPUNet | ONNX | w8a16 | Snapdragon® 8
|
| 80 |
-
| GPUNet | ONNX | w8a16 |
|
| 81 |
-
| GPUNet | ONNX | w8a16 |
|
| 82 |
-
| GPUNet | ONNX | w8a16 |
|
| 83 |
-
| GPUNet | ONNX | w8a16 |
|
| 84 |
-
| GPUNet | ONNX | w8a16 |
|
| 85 |
-
| GPUNet | ONNX | w8a16 |
|
| 86 |
-
| GPUNet | ONNX |
|
| 87 |
-
| GPUNet | ONNX |
|
| 88 |
-
| GPUNet | ONNX |
|
| 89 |
-
| GPUNet | ONNX |
|
| 90 |
-
| GPUNet | ONNX |
|
| 91 |
-
| GPUNet | ONNX | w8a8 |
|
| 92 |
-
| GPUNet | ONNX | w8a8 |
|
| 93 |
-
| GPUNet | ONNX | w8a8 |
|
| 94 |
-
| GPUNet | ONNX | w8a8 | Snapdragon®
|
| 95 |
-
| GPUNet | ONNX | w8a8 | Snapdragon®
|
| 96 |
-
| GPUNet |
|
| 97 |
-
| GPUNet |
|
| 98 |
-
| GPUNet |
|
| 99 |
-
| GPUNet |
|
| 100 |
-
| GPUNet |
|
| 101 |
-
| GPUNet |
|
| 102 |
-
| GPUNet |
|
| 103 |
-
| GPUNet |
|
| 104 |
-
| GPUNet | QNN_DLC | float |
|
| 105 |
-
| GPUNet | QNN_DLC | float |
|
| 106 |
-
| GPUNet | QNN_DLC | float |
|
| 107 |
-
| GPUNet | QNN_DLC | float | Snapdragon®
|
| 108 |
-
| GPUNet | QNN_DLC |
|
| 109 |
-
| GPUNet | QNN_DLC |
|
| 110 |
-
| GPUNet | QNN_DLC |
|
| 111 |
-
| GPUNet | QNN_DLC |
|
| 112 |
-
| GPUNet | QNN_DLC |
|
| 113 |
-
| GPUNet | QNN_DLC |
|
| 114 |
-
| GPUNet | QNN_DLC |
|
| 115 |
-
| GPUNet | QNN_DLC |
|
| 116 |
-
| GPUNet | QNN_DLC |
|
| 117 |
-
| GPUNet | QNN_DLC |
|
| 118 |
-
| GPUNet | QNN_DLC |
|
| 119 |
-
| GPUNet | QNN_DLC |
|
| 120 |
-
| GPUNet | QNN_DLC | w8a16 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 121 |
| GPUNet | QNN_DLC | w8a16 | Snapdragon® 8 Elite For Galaxy Mobile | 0.522 ms | 0 - 41 MB | NPU
|
| 122 |
-
| GPUNet | QNN_DLC | w8a16 | Snapdragon® 7 Gen 4 Mobile | 1.
|
| 123 |
-
| GPUNet | QNN_DLC |
|
| 124 |
-
| GPUNet | QNN_DLC | w8a8 | Snapdragon®
|
| 125 |
-
| GPUNet | QNN_DLC | w8a8 | Snapdragon®
|
| 126 |
-
| GPUNet | QNN_DLC | w8a8 | Snapdragon®
|
| 127 |
-
| GPUNet | QNN_DLC | w8a8 |
|
| 128 |
-
| GPUNet | QNN_DLC | w8a8 |
|
| 129 |
-
| GPUNet | QNN_DLC | w8a8 |
|
| 130 |
-
| GPUNet | QNN_DLC | w8a8 | Qualcomm®
|
| 131 |
-
| GPUNet | QNN_DLC | w8a8 | Qualcomm®
|
| 132 |
-
| GPUNet | QNN_DLC | w8a8 | Qualcomm®
|
| 133 |
-
| GPUNet | QNN_DLC | w8a8 | Qualcomm®
|
| 134 |
-
| GPUNet | QNN_DLC | w8a8 | Qualcomm®
|
| 135 |
-
| GPUNet | QNN_DLC | w8a8 | Qualcomm®
|
| 136 |
-
| GPUNet | QNN_DLC | w8a8 |
|
| 137 |
-
| GPUNet | QNN_DLC | w8a8 |
|
| 138 |
-
| GPUNet |
|
| 139 |
-
| GPUNet |
|
| 140 |
-
| GPUNet |
|
| 141 |
-
| GPUNet |
|
| 142 |
-
| GPUNet |
|
| 143 |
-
| GPUNet |
|
| 144 |
-
| GPUNet | TFLITE | float |
|
| 145 |
-
| GPUNet | TFLITE | float |
|
| 146 |
-
| GPUNet | TFLITE | float |
|
| 147 |
-
| GPUNet | TFLITE | float |
|
| 148 |
-
| GPUNet | TFLITE |
|
| 149 |
-
| GPUNet | TFLITE |
|
| 150 |
-
| GPUNet | TFLITE |
|
| 151 |
-
| GPUNet | TFLITE |
|
| 152 |
-
| GPUNet | TFLITE |
|
| 153 |
-
| GPUNet | TFLITE |
|
| 154 |
-
| GPUNet | TFLITE |
|
| 155 |
-
| GPUNet | TFLITE |
|
| 156 |
-
| GPUNet | TFLITE |
|
| 157 |
-
| GPUNet | TFLITE | w8a8 |
|
| 158 |
-
| GPUNet | TFLITE | w8a8 |
|
| 159 |
-
| GPUNet | TFLITE | w8a8 | Snapdragon® 8
|
| 160 |
-
| GPUNet | TFLITE | w8a8 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 161 |
|
| 162 |
## License
|
| 163 |
* The license for the original implementation of GPUNet can be found
|
|
|
|
| 29 |
|
| 30 |
| Runtime | Precision | Chipset | SDK Versions | Download |
|
| 31 |
|---|---|---|---|---|
|
| 32 |
+
| ONNX | float | Universal | QAIRT 2.42, ONNX Runtime 1.24.3 | [Download](https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.53.0/gpunet-onnx-float.zip)
|
| 33 |
+
| ONNX | w8a16 | Universal | QAIRT 2.42, ONNX Runtime 1.24.3 | [Download](https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.53.0/gpunet-onnx-w8a16.zip)
|
| 34 |
+
| ONNX | w8a8 | Universal | QAIRT 2.42, ONNX Runtime 1.24.3 | [Download](https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.53.0/gpunet-onnx-w8a8.zip)
|
| 35 |
+
| QNN_DLC | float | Universal | QAIRT 2.45 | [Download](https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.53.0/gpunet-qnn_dlc-float.zip)
|
| 36 |
+
| QNN_DLC | w8a16 | Universal | QAIRT 2.45 | [Download](https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.53.0/gpunet-qnn_dlc-w8a16.zip)
|
| 37 |
+
| QNN_DLC | w8a8 | Universal | QAIRT 2.45 | [Download](https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.53.0/gpunet-qnn_dlc-w8a8.zip)
|
| 38 |
+
| TFLITE | float | Universal | QAIRT 2.45 | [Download](https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.53.0/gpunet-tflite-float.zip)
|
| 39 |
+
| TFLITE | w8a8 | Universal | QAIRT 2.45 | [Download](https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.53.0/gpunet-tflite-w8a8.zip)
|
| 40 |
|
| 41 |
For more device-specific assets and performance metrics, visit **[GPUNet on Qualcomm® AI Hub](https://aihub.qualcomm.com/models/gpunet)**.
|
| 42 |
|
|
|
|
| 66 |
## Performance Summary
|
| 67 |
| Model | Runtime | Precision | Chipset | Inference Time (ms) | Peak Memory Range (MB) | Primary Compute Unit
|
| 68 |
|---|---|---|---|---|---|---
|
| 69 |
+
| GPUNet | ONNX | float | Snapdragon® 8 Elite Gen 5 Mobile | 0.503 ms | 0 - 36 MB | NPU
|
| 70 |
+
| GPUNet | ONNX | float | Snapdragon® 8 Elite Mobile | 0.605 ms | 0 - 36 MB | NPU
|
| 71 |
+
| GPUNet | ONNX | float | Snapdragon® X2 Elite | 0.483 ms | 24 - 24 MB | NPU
|
| 72 |
+
| GPUNet | ONNX | float | Snapdragon® X Elite | 1.149 ms | 24 - 24 MB | NPU
|
| 73 |
+
| GPUNet | ONNX | float | Snapdragon® X Elite | 1.149 ms | 24 - 24 MB | NPU
|
| 74 |
+
| GPUNet | ONNX | float | Snapdragon® 8 Gen 3 Mobile | 0.778 ms | 0 - 62 MB | NPU
|
| 75 |
+
| GPUNet | ONNX | float | Qualcomm® QCS8550 (Proxy) | 1.039 ms | 0 - 2 MB | NPU
|
| 76 |
+
| GPUNet | ONNX | float | Qualcomm® QCS9075 | 1.353 ms | 1 - 3 MB | NPU
|
| 77 |
+
| GPUNet | ONNX | float | Snapdragon® 8 Elite For Galaxy Mobile | 0.605 ms | 0 - 36 MB | NPU
|
| 78 |
+
| GPUNet | ONNX | w8a16 | Snapdragon® 8 Elite Gen 5 Mobile | 0.355 ms | 0 - 48 MB | NPU
|
| 79 |
+
| GPUNet | ONNX | w8a16 | Snapdragon® 8 Elite Mobile | 0.433 ms | 0 - 42 MB | NPU
|
| 80 |
+
| GPUNet | ONNX | w8a16 | Snapdragon® X2 Elite | 0.384 ms | 12 - 12 MB | NPU
|
| 81 |
+
| GPUNet | ONNX | w8a16 | Snapdragon® X Elite | 0.974 ms | 12 - 12 MB | NPU
|
| 82 |
+
| GPUNet | ONNX | w8a16 | Snapdragon® X Elite | 0.974 ms | 12 - 12 MB | NPU
|
| 83 |
+
| GPUNet | ONNX | w8a16 | Snapdragon® 8 Gen 3 Mobile | 0.6 ms | 0 - 61 MB | NPU
|
| 84 |
+
| GPUNet | ONNX | w8a16 | Qualcomm® QCS6490 | 98.025 ms | 25 - 33 MB | CPU
|
| 85 |
+
| GPUNet | ONNX | w8a16 | Qualcomm® QCS8550 (Proxy) | 0.825 ms | 0 - 16 MB | NPU
|
| 86 |
+
| GPUNet | ONNX | w8a16 | Qualcomm® QCS9075 | 0.98 ms | 0 - 3 MB | NPU
|
| 87 |
+
| GPUNet | ONNX | w8a16 | Qualcomm® QCM6690 | 49.714 ms | 29 - 37 MB | CPU
|
| 88 |
+
| GPUNet | ONNX | w8a16 | Snapdragon® 8 Elite For Galaxy Mobile | 0.433 ms | 0 - 42 MB | NPU
|
| 89 |
+
| GPUNet | ONNX | w8a16 | Snapdragon® 7 Gen 4 Mobile | 38.185 ms | 29 - 37 MB | CPU
|
| 90 |
+
| GPUNet | ONNX | w8a16 | Snapdragon® 7 Gen 4 Mobile | 38.185 ms | 29 - 37 MB | CPU
|
| 91 |
+
| GPUNet | ONNX | w8a8 | Snapdragon® 8 Elite Gen 5 Mobile | 0.358 ms | 0 - 48 MB | NPU
|
| 92 |
+
| GPUNet | ONNX | w8a8 | Snapdragon® 8 Elite Mobile | 0.395 ms | 0 - 44 MB | NPU
|
| 93 |
+
| GPUNet | ONNX | w8a8 | Snapdragon® X2 Elite | 0.308 ms | 12 - 12 MB | NPU
|
| 94 |
+
| GPUNet | ONNX | w8a8 | Snapdragon® X Elite | 0.722 ms | 12 - 12 MB | NPU
|
| 95 |
+
| GPUNet | ONNX | w8a8 | Snapdragon® X Elite | 0.722 ms | 12 - 12 MB | NPU
|
| 96 |
+
| GPUNet | ONNX | w8a8 | Snapdragon® 8 Gen 3 Mobile | 0.462 ms | 0 - 62 MB | NPU
|
| 97 |
+
| GPUNet | ONNX | w8a8 | Qualcomm® QCS6490 | 16.619 ms | 1 - 14 MB | CPU
|
| 98 |
+
| GPUNet | ONNX | w8a8 | Qualcomm® QCS8550 (Proxy) | 0.616 ms | 0 - 22 MB | NPU
|
| 99 |
+
| GPUNet | ONNX | w8a8 | Qualcomm® QCS9075 | 0.723 ms | 0 - 3 MB | NPU
|
| 100 |
+
| GPUNet | ONNX | w8a8 | Qualcomm® QCM6690 | 10.202 ms | 7 - 15 MB | CPU
|
| 101 |
+
| GPUNet | ONNX | w8a8 | Snapdragon® 8 Elite For Galaxy Mobile | 0.395 ms | 0 - 44 MB | NPU
|
| 102 |
+
| GPUNet | ONNX | w8a8 | Snapdragon® 7 Gen 4 Mobile | 7.765 ms | 7 - 16 MB | CPU
|
| 103 |
+
| GPUNet | ONNX | w8a8 | Snapdragon® 7 Gen 4 Mobile | 7.765 ms | 7 - 16 MB | CPU
|
| 104 |
+
| GPUNet | QNN_DLC | float | Snapdragon® 8 Elite Gen 5 Mobile | 0.567 ms | 1 - 35 MB | NPU
|
| 105 |
+
| GPUNet | QNN_DLC | float | Snapdragon® 8 Elite Mobile | 0.711 ms | 0 - 30 MB | NPU
|
| 106 |
+
| GPUNet | QNN_DLC | float | Snapdragon® X2 Elite | 0.648 ms | 1 - 1 MB | NPU
|
| 107 |
+
| GPUNet | QNN_DLC | float | Snapdragon® X Elite | 1.4 ms | 1 - 1 MB | NPU
|
| 108 |
+
| GPUNet | QNN_DLC | float | Snapdragon® X Elite | 1.4 ms | 1 - 1 MB | NPU
|
| 109 |
+
| GPUNet | QNN_DLC | float | Snapdragon® 8 Gen 3 Mobile | 0.917 ms | 0 - 56 MB | NPU
|
| 110 |
+
| GPUNet | QNN_DLC | float | Qualcomm® QCS8275 (Proxy) | 4.684 ms | 0 - 30 MB | NPU
|
| 111 |
+
| GPUNet | QNN_DLC | float | Qualcomm® QCS8550 (Proxy) | 1.271 ms | 0 - 6 MB | NPU
|
| 112 |
+
| GPUNet | QNN_DLC | float | Qualcomm® SA8775P | 1.718 ms | 1 - 33 MB | NPU
|
| 113 |
+
| GPUNet | QNN_DLC | float | Qualcomm® SA8775P | 1.718 ms | 1 - 33 MB | NPU
|
| 114 |
+
| GPUNet | QNN_DLC | float | Qualcomm® SA8775P | 1.718 ms | 1 - 33 MB | NPU
|
| 115 |
+
| GPUNet | QNN_DLC | float | Qualcomm® QCS9075 | 1.572 ms | 1 - 3 MB | NPU
|
| 116 |
+
| GPUNet | QNN_DLC | float | Qualcomm® QCS8450 (Proxy) | 2.416 ms | 0 - 62 MB | NPU
|
| 117 |
+
| GPUNet | QNN_DLC | float | Qualcomm® SA7255P | 4.684 ms | 0 - 30 MB | NPU
|
| 118 |
+
| GPUNet | QNN_DLC | float | Qualcomm® SA8295P | 2.286 ms | 0 - 32 MB | NPU
|
| 119 |
+
| GPUNet | QNN_DLC | float | Snapdragon® 8 Elite For Galaxy Mobile | 0.711 ms | 0 - 30 MB | NPU
|
| 120 |
+
| GPUNet | QNN_DLC | w8a16 | Snapdragon® 8 Elite Gen 5 Mobile | 0.432 ms | 0 - 44 MB | NPU
|
| 121 |
+
| GPUNet | QNN_DLC | w8a16 | Snapdragon® 8 Elite Mobile | 0.522 ms | 0 - 41 MB | NPU
|
| 122 |
+
| GPUNet | QNN_DLC | w8a16 | Snapdragon® X2 Elite | 0.558 ms | 0 - 0 MB | NPU
|
| 123 |
+
| GPUNet | QNN_DLC | w8a16 | Snapdragon® X Elite | 1.239 ms | 0 - 0 MB | NPU
|
| 124 |
+
| GPUNet | QNN_DLC | w8a16 | Snapdragon® X Elite | 1.239 ms | 0 - 0 MB | NPU
|
| 125 |
+
| GPUNet | QNN_DLC | w8a16 | Snapdragon® 8 Gen 3 Mobile | 0.765 ms | 0 - 58 MB | NPU
|
| 126 |
+
| GPUNet | QNN_DLC | w8a16 | Qualcomm® QCS6490 | 3.256 ms | 0 - 2 MB | NPU
|
| 127 |
+
| GPUNet | QNN_DLC | w8a16 | Qualcomm® QCS8275 (Proxy) | 2.452 ms | 0 - 42 MB | NPU
|
| 128 |
+
| GPUNet | QNN_DLC | w8a16 | Qualcomm® QCS8550 (Proxy) | 1.069 ms | 0 - 2 MB | NPU
|
| 129 |
+
| GPUNet | QNN_DLC | w8a16 | Qualcomm® SA8775P | 1.272 ms | 0 - 44 MB | NPU
|
| 130 |
+
| GPUNet | QNN_DLC | w8a16 | Qualcomm® SA8775P | 1.272 ms | 0 - 44 MB | NPU
|
| 131 |
+
| GPUNet | QNN_DLC | w8a16 | Qualcomm® SA8775P | 1.272 ms | 0 - 44 MB | NPU
|
| 132 |
+
| GPUNet | QNN_DLC | w8a16 | Qualcomm® QCS9075 | 1.228 ms | 2 - 4 MB | NPU
|
| 133 |
+
| GPUNet | QNN_DLC | w8a16 | Qualcomm® QCM6690 | 6.511 ms | 0 - 165 MB | NPU
|
| 134 |
+
| GPUNet | QNN_DLC | w8a16 | Qualcomm® QCS8450 (Proxy) | 1.431 ms | 0 - 61 MB | NPU
|
| 135 |
+
| GPUNet | QNN_DLC | w8a16 | Qualcomm® SA7255P | 2.452 ms | 0 - 42 MB | NPU
|
| 136 |
+
| GPUNet | QNN_DLC | w8a16 | Qualcomm® SA8295P | 1.678 ms | 0 - 39 MB | NPU
|
| 137 |
| GPUNet | QNN_DLC | w8a16 | Snapdragon® 8 Elite For Galaxy Mobile | 0.522 ms | 0 - 41 MB | NPU
|
| 138 |
+
| GPUNet | QNN_DLC | w8a16 | Snapdragon® 7 Gen 4 Mobile | 1.287 ms | 0 - 43 MB | NPU
|
| 139 |
+
| GPUNet | QNN_DLC | w8a16 | Snapdragon® 7 Gen 4 Mobile | 1.287 ms | 0 - 43 MB | NPU
|
| 140 |
+
| GPUNet | QNN_DLC | w8a8 | Snapdragon® 8 Elite Gen 5 Mobile | 0.295 ms | 0 - 44 MB | NPU
|
| 141 |
+
| GPUNet | QNN_DLC | w8a8 | Snapdragon® 8 Elite Mobile | 0.339 ms | 0 - 37 MB | NPU
|
| 142 |
+
| GPUNet | QNN_DLC | w8a8 | Snapdragon® X2 Elite | 0.347 ms | 0 - 0 MB | NPU
|
| 143 |
+
| GPUNet | QNN_DLC | w8a8 | Snapdragon® X Elite | 0.712 ms | 0 - 0 MB | NPU
|
| 144 |
+
| GPUNet | QNN_DLC | w8a8 | Snapdragon® X Elite | 0.712 ms | 0 - 0 MB | NPU
|
| 145 |
+
| GPUNet | QNN_DLC | w8a8 | Snapdragon® 8 Gen 3 Mobile | 0.462 ms | 0 - 55 MB | NPU
|
| 146 |
+
| GPUNet | QNN_DLC | w8a8 | Qualcomm® QCS6490 | 2.005 ms | 2 - 4 MB | NPU
|
| 147 |
+
| GPUNet | QNN_DLC | w8a8 | Qualcomm® QCS8275 (Proxy) | 1.415 ms | 0 - 38 MB | NPU
|
| 148 |
+
| GPUNet | QNN_DLC | w8a8 | Qualcomm® QCS8550 (Proxy) | 0.611 ms | 0 - 2 MB | NPU
|
| 149 |
+
| GPUNet | QNN_DLC | w8a8 | Qualcomm® SA8775P | 0.798 ms | 0 - 40 MB | NPU
|
| 150 |
+
| GPUNet | QNN_DLC | w8a8 | Qualcomm® SA8775P | 0.798 ms | 0 - 40 MB | NPU
|
| 151 |
+
| GPUNet | QNN_DLC | w8a8 | Qualcomm® SA8775P | 0.798 ms | 0 - 40 MB | NPU
|
| 152 |
+
| GPUNet | QNN_DLC | w8a8 | Qualcomm® QCS9075 | 0.691 ms | 2 - 4 MB | NPU
|
| 153 |
+
| GPUNet | QNN_DLC | w8a8 | Qualcomm® QCM6690 | 3.502 ms | 0 - 42 MB | NPU
|
| 154 |
+
| GPUNet | QNN_DLC | w8a8 | Qualcomm® QCS8450 (Proxy) | 0.857 ms | 0 - 58 MB | NPU
|
| 155 |
+
| GPUNet | QNN_DLC | w8a8 | Qualcomm® SA7255P | 1.415 ms | 0 - 38 MB | NPU
|
| 156 |
+
| GPUNet | QNN_DLC | w8a8 | Qualcomm® SA8295P | 1.123 ms | 0 - 37 MB | NPU
|
| 157 |
+
| GPUNet | QNN_DLC | w8a8 | Snapdragon® 8 Elite For Galaxy Mobile | 0.339 ms | 0 - 37 MB | NPU
|
| 158 |
+
| GPUNet | QNN_DLC | w8a8 | Snapdragon® 7 Gen 4 Mobile | 0.783 ms | 0 - 40 MB | NPU
|
| 159 |
+
| GPUNet | QNN_DLC | w8a8 | Snapdragon® 7 Gen 4 Mobile | 0.783 ms | 0 - 40 MB | NPU
|
| 160 |
+
| GPUNet | TFLITE | float | Snapdragon® 8 Elite Gen 5 Mobile | 0.559 ms | 0 - 47 MB | NPU
|
| 161 |
+
| GPUNet | TFLITE | float | Snapdragon® 8 Elite Mobile | 0.698 ms | 0 - 42 MB | NPU
|
| 162 |
+
| GPUNet | TFLITE | float | Snapdragon® 8 Gen 3 Mobile | 0.903 ms | 0 - 74 MB | NPU
|
| 163 |
+
| GPUNet | TFLITE | float | Qualcomm® QCS8275 (Proxy) | 4.739 ms | 0 - 43 MB | NPU
|
| 164 |
+
| GPUNet | TFLITE | float | Qualcomm® QCS8550 (Proxy) | 1.263 ms | 0 - 31 MB | NPU
|
| 165 |
+
| GPUNet | TFLITE | float | Qualcomm® SA8775P | 1.754 ms | 0 - 46 MB | NPU
|
| 166 |
+
| GPUNet | TFLITE | float | Qualcomm® SA8775P | 1.754 ms | 0 - 46 MB | NPU
|
| 167 |
+
| GPUNet | TFLITE | float | Qualcomm® SA8775P | 1.754 ms | 0 - 46 MB | NPU
|
| 168 |
+
| GPUNet | TFLITE | float | Qualcomm® QCS9075 | 1.576 ms | 0 - 27 MB | NPU
|
| 169 |
+
| GPUNet | TFLITE | float | Qualcomm® QCS8450 (Proxy) | 2.41 ms | 0 - 79 MB | NPU
|
| 170 |
+
| GPUNet | TFLITE | float | Qualcomm® SA7255P | 4.739 ms | 0 - 43 MB | NPU
|
| 171 |
+
| GPUNet | TFLITE | float | Qualcomm® SA8295P | 2.264 ms | 0 - 44 MB | NPU
|
| 172 |
+
| GPUNet | TFLITE | float | Snapdragon® 8 Elite For Galaxy Mobile | 0.698 ms | 0 - 42 MB | NPU
|
| 173 |
+
| GPUNet | TFLITE | w8a8 | Snapdragon® 8 Elite Gen 5 Mobile | 0.237 ms | 0 - 45 MB | NPU
|
| 174 |
+
| GPUNet | TFLITE | w8a8 | Snapdragon® 8 Elite Mobile | 0.274 ms | 0 - 39 MB | NPU
|
| 175 |
+
| GPUNet | TFLITE | w8a8 | Snapdragon® 8 Gen 3 Mobile | 0.344 ms | 0 - 55 MB | NPU
|
| 176 |
+
| GPUNet | TFLITE | w8a8 | Qualcomm® QCS6490 | 1.583 ms | 0 - 15 MB | NPU
|
| 177 |
+
| GPUNet | TFLITE | w8a8 | Qualcomm® QCS8275 (Proxy) | 1.119 ms | 0 - 39 MB | NPU
|
| 178 |
+
| GPUNet | TFLITE | w8a8 | Qualcomm® QCS8550 (Proxy) | 0.43 ms | 0 - 2 MB | NPU
|
| 179 |
+
| GPUNet | TFLITE | w8a8 | Qualcomm® SA8775P | 0.63 ms | 0 - 42 MB | NPU
|
| 180 |
+
| GPUNet | TFLITE | w8a8 | Qualcomm® SA8775P | 0.63 ms | 0 - 42 MB | NPU
|
| 181 |
+
| GPUNet | TFLITE | w8a8 | Qualcomm® SA8775P | 0.63 ms | 0 - 42 MB | NPU
|
| 182 |
+
| GPUNet | TFLITE | w8a8 | Qualcomm® QCS9075 | 0.529 ms | 0 - 14 MB | NPU
|
| 183 |
+
| GPUNet | TFLITE | w8a8 | Qualcomm® QCM6690 | 3.051 ms | 0 - 41 MB | NPU
|
| 184 |
+
| GPUNet | TFLITE | w8a8 | Qualcomm® QCS8450 (Proxy) | 0.687 ms | 0 - 57 MB | NPU
|
| 185 |
+
| GPUNet | TFLITE | w8a8 | Qualcomm® SA7255P | 1.119 ms | 0 - 39 MB | NPU
|
| 186 |
+
| GPUNet | TFLITE | w8a8 | Qualcomm® SA8295P | 0.917 ms | 0 - 36 MB | NPU
|
| 187 |
+
| GPUNet | TFLITE | w8a8 | Snapdragon® 8 Elite For Galaxy Mobile | 0.274 ms | 0 - 39 MB | NPU
|
| 188 |
+
| GPUNet | TFLITE | w8a8 | Snapdragon® 7 Gen 4 Mobile | 0.616 ms | 0 - 39 MB | NPU
|
| 189 |
+
| GPUNet | TFLITE | w8a8 | Snapdragon® 7 Gen 4 Mobile | 0.616 ms | 0 - 39 MB | NPU
|
| 190 |
|
| 191 |
## License
|
| 192 |
* The license for the original implementation of GPUNet can be found
|
release_assets.json
CHANGED
|
@@ -1,68 +1,68 @@
|
|
| 1 |
{
|
| 2 |
-
"version": "0.
|
| 3 |
"precisions": {
|
| 4 |
-
"
|
| 5 |
"universal_assets": {
|
| 6 |
"tflite": {
|
| 7 |
"tool_versions": {
|
| 8 |
"qairt": "2.45.0.260326154327",
|
| 9 |
-
"litert": "1.4.
|
| 10 |
},
|
| 11 |
-
"download_url": "https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.
|
| 12 |
},
|
| 13 |
"qnn_dlc": {
|
| 14 |
"tool_versions": {
|
| 15 |
"qairt": "2.45.0.260326154327"
|
| 16 |
},
|
| 17 |
-
"download_url": "https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.
|
| 18 |
},
|
| 19 |
"onnx": {
|
| 20 |
"tool_versions": {
|
| 21 |
"qairt": "2.42.0.251225135753_193295",
|
| 22 |
"onnx_runtime": "1.24.3"
|
| 23 |
},
|
| 24 |
-
"download_url": "https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.
|
| 25 |
}
|
| 26 |
}
|
| 27 |
},
|
| 28 |
-
"
|
| 29 |
"universal_assets": {
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 30 |
"qnn_dlc": {
|
| 31 |
"tool_versions": {
|
| 32 |
"qairt": "2.45.0.260326154327"
|
| 33 |
},
|
| 34 |
-
"download_url": "https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.
|
| 35 |
},
|
| 36 |
"onnx": {
|
| 37 |
"tool_versions": {
|
| 38 |
"qairt": "2.42.0.251225135753_193295",
|
| 39 |
"onnx_runtime": "1.24.3"
|
| 40 |
},
|
| 41 |
-
"download_url": "https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.
|
| 42 |
}
|
| 43 |
}
|
| 44 |
},
|
| 45 |
-
"
|
| 46 |
"universal_assets": {
|
| 47 |
-
"tflite": {
|
| 48 |
-
"tool_versions": {
|
| 49 |
-
"qairt": "2.45.0.260326154327",
|
| 50 |
-
"litert": "1.4.2"
|
| 51 |
-
},
|
| 52 |
-
"download_url": "https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.52.0/gpunet-tflite-float.zip"
|
| 53 |
-
},
|
| 54 |
"qnn_dlc": {
|
| 55 |
"tool_versions": {
|
| 56 |
"qairt": "2.45.0.260326154327"
|
| 57 |
},
|
| 58 |
-
"download_url": "https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.
|
| 59 |
},
|
| 60 |
"onnx": {
|
| 61 |
"tool_versions": {
|
| 62 |
"qairt": "2.42.0.251225135753_193295",
|
| 63 |
"onnx_runtime": "1.24.3"
|
| 64 |
},
|
| 65 |
-
"download_url": "https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.
|
| 66 |
}
|
| 67 |
}
|
| 68 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"version": "0.53.0",
|
| 3 |
"precisions": {
|
| 4 |
+
"float": {
|
| 5 |
"universal_assets": {
|
| 6 |
"tflite": {
|
| 7 |
"tool_versions": {
|
| 8 |
"qairt": "2.45.0.260326154327",
|
| 9 |
+
"litert": "1.4.3"
|
| 10 |
},
|
| 11 |
+
"download_url": "https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.53.0/gpunet-tflite-float.zip"
|
| 12 |
},
|
| 13 |
"qnn_dlc": {
|
| 14 |
"tool_versions": {
|
| 15 |
"qairt": "2.45.0.260326154327"
|
| 16 |
},
|
| 17 |
+
"download_url": "https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.53.0/gpunet-qnn_dlc-float.zip"
|
| 18 |
},
|
| 19 |
"onnx": {
|
| 20 |
"tool_versions": {
|
| 21 |
"qairt": "2.42.0.251225135753_193295",
|
| 22 |
"onnx_runtime": "1.24.3"
|
| 23 |
},
|
| 24 |
+
"download_url": "https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.53.0/gpunet-onnx-float.zip"
|
| 25 |
}
|
| 26 |
}
|
| 27 |
},
|
| 28 |
+
"w8a8": {
|
| 29 |
"universal_assets": {
|
| 30 |
+
"tflite": {
|
| 31 |
+
"tool_versions": {
|
| 32 |
+
"qairt": "2.45.0.260326154327",
|
| 33 |
+
"litert": "1.4.3"
|
| 34 |
+
},
|
| 35 |
+
"download_url": "https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.53.0/gpunet-tflite-w8a8.zip"
|
| 36 |
+
},
|
| 37 |
"qnn_dlc": {
|
| 38 |
"tool_versions": {
|
| 39 |
"qairt": "2.45.0.260326154327"
|
| 40 |
},
|
| 41 |
+
"download_url": "https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.53.0/gpunet-qnn_dlc-w8a8.zip"
|
| 42 |
},
|
| 43 |
"onnx": {
|
| 44 |
"tool_versions": {
|
| 45 |
"qairt": "2.42.0.251225135753_193295",
|
| 46 |
"onnx_runtime": "1.24.3"
|
| 47 |
},
|
| 48 |
+
"download_url": "https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.53.0/gpunet-onnx-w8a8.zip"
|
| 49 |
}
|
| 50 |
}
|
| 51 |
},
|
| 52 |
+
"w8a16": {
|
| 53 |
"universal_assets": {
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 54 |
"qnn_dlc": {
|
| 55 |
"tool_versions": {
|
| 56 |
"qairt": "2.45.0.260326154327"
|
| 57 |
},
|
| 58 |
+
"download_url": "https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.53.0/gpunet-qnn_dlc-w8a16.zip"
|
| 59 |
},
|
| 60 |
"onnx": {
|
| 61 |
"tool_versions": {
|
| 62 |
"qairt": "2.42.0.251225135753_193295",
|
| 63 |
"onnx_runtime": "1.24.3"
|
| 64 |
},
|
| 65 |
+
"download_url": "https://qaihub-public-assets.s3.us-west-2.amazonaws.com/qai-hub-models/models/gpunet/releases/v0.53.0/gpunet-onnx-w8a16.zip"
|
| 66 |
}
|
| 67 |
}
|
| 68 |
}
|