v0.36.0
Browse files
See https://github.com/quic/ai-hub-models/releases/v0.36.0 for changelog.
- Nomic-Embed-Text.dlc +2 -2
- Nomic-Embed-Text.onnx.zip +2 -2
- Nomic-Embed-Text.tflite +2 -2
- README.md +29 -29
- precompiled/qualcomm-snapdragon-x-elite/Nomic-Embed-Text.bin +2 -2
- precompiled/qualcomm-snapdragon-x-elite/Nomic-Embed-Text.onnx.zip +2 -2
- precompiled/qualcomm-snapdragon-x-elite/sdk_versions.yml +1 -1
- sdk_versions.yml +3 -3
Nomic-Embed-Text.dlc
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a249613aa0e2e849f8b2feadfcadae8c343d60cfe4a3e37fcdc95a4ef70d89ad
|
| 3 |
+
size 547931588
|
Nomic-Embed-Text.onnx.zip
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:527ece7c4692bdddcb2d0db096106f9b3215e243da84b23a42dc808849d19da5
|
| 3 |
+
size 507492854
|
Nomic-Embed-Text.tflite
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:345165780d2537d4720ed5bddda141d1938fba403c1041ff05d8788c5f8e651f
|
| 3 |
+
size 547919472
|
README.md
CHANGED
|
@@ -35,35 +35,35 @@ More details on model performance across various devices, can be found
|
|
| 35 |
|
| 36 |
| Model | Precision | Device | Chipset | Target Runtime | Inference Time (ms) | Peak Memory Range (MB) | Primary Compute Unit | Target Model
|
| 37 |
|---|---|---|---|---|---|---|---|---|
|
| 38 |
-
| Nomic-Embed-Text | float | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | TFLITE |
|
| 39 |
-
| Nomic-Embed-Text | float | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_DLC | 28.
|
| 40 |
-
| Nomic-Embed-Text | float | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | TFLITE |
|
| 41 |
-
| Nomic-Embed-Text | float | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | QNN_DLC | 10.
|
| 42 |
-
| Nomic-Embed-Text | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | TFLITE |
|
| 43 |
-
| Nomic-Embed-Text | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_DLC | 7.
|
| 44 |
-
| Nomic-Embed-Text | float | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | TFLITE |
|
| 45 |
-
| Nomic-Embed-Text | float | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_DLC | 9.
|
| 46 |
-
| Nomic-Embed-Text | float | SA7255P ADP | Qualcomm® SA7255P | TFLITE |
|
| 47 |
-
| Nomic-Embed-Text | float | SA7255P ADP | Qualcomm® SA7255P | QNN_DLC | 28.
|
| 48 |
-
| Nomic-Embed-Text | float | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | TFLITE |
|
| 49 |
-
| Nomic-Embed-Text | float | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_DLC | 7.
|
| 50 |
-
| Nomic-Embed-Text | float | SA8295P ADP | Qualcomm® SA8295P | TFLITE |
|
| 51 |
-
| Nomic-Embed-Text | float | SA8295P ADP | Qualcomm® SA8295P | QNN_DLC | 10.
|
| 52 |
-
| Nomic-Embed-Text | float | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | TFLITE |
|
| 53 |
-
| Nomic-Embed-Text | float | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_DLC | 7.
|
| 54 |
-
| Nomic-Embed-Text | float | SA8775P ADP | Qualcomm® SA8775P | TFLITE |
|
| 55 |
-
| Nomic-Embed-Text | float | SA8775P ADP | Qualcomm® SA8775P | QNN_DLC | 9.
|
| 56 |
-
| Nomic-Embed-Text | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | TFLITE |
|
| 57 |
-
| Nomic-Embed-Text | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | QNN_DLC | 7.
|
| 58 |
-
| Nomic-Embed-Text | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | ONNX | 8.
|
| 59 |
-
| Nomic-Embed-Text | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | TFLITE |
|
| 60 |
-
| Nomic-Embed-Text | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_DLC | 5.
|
| 61 |
-
| Nomic-Embed-Text | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | ONNX | 5.
|
| 62 |
-
| Nomic-Embed-Text | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | TFLITE |
|
| 63 |
-
| Nomic-Embed-Text | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | QNN_DLC |
|
| 64 |
-
| Nomic-Embed-Text | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | ONNX | 5.
|
| 65 |
-
| Nomic-Embed-Text | float | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_DLC |
|
| 66 |
-
| Nomic-Embed-Text | float | Snapdragon X Elite CRD | Snapdragon® X Elite | ONNX | 9.
|
| 67 |
|
| 68 |
|
| 69 |
|
|
|
|
| 35 |
|
| 36 |
| Model | Precision | Device | Chipset | Target Runtime | Inference Time (ms) | Peak Memory Range (MB) | Primary Compute Unit | Target Model
|
| 37 |
|---|---|---|---|---|---|---|---|---|
|
| 38 |
+
| Nomic-Embed-Text | float | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | TFLITE | 31.651 ms | 0 - 364 MB | NPU | [Nomic-Embed-Text.tflite](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.tflite) |
|
| 39 |
+
| Nomic-Embed-Text | float | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_DLC | 28.185 ms | 0 - 361 MB | NPU | [Nomic-Embed-Text.dlc](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.dlc) |
|
| 40 |
+
| Nomic-Embed-Text | float | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | TFLITE | 10.867 ms | 0 - 372 MB | NPU | [Nomic-Embed-Text.tflite](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.tflite) |
|
| 41 |
+
| Nomic-Embed-Text | float | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | QNN_DLC | 10.794 ms | 0 - 371 MB | NPU | [Nomic-Embed-Text.dlc](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.dlc) |
|
| 42 |
+
| Nomic-Embed-Text | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | TFLITE | 8.779 ms | 0 - 15 MB | NPU | [Nomic-Embed-Text.tflite](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.tflite) |
|
| 43 |
+
| Nomic-Embed-Text | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_DLC | 7.292 ms | 0 - 25 MB | NPU | [Nomic-Embed-Text.dlc](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.dlc) |
|
| 44 |
+
| Nomic-Embed-Text | float | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | TFLITE | 11.131 ms | 0 - 364 MB | NPU | [Nomic-Embed-Text.tflite](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.tflite) |
|
| 45 |
+
| Nomic-Embed-Text | float | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_DLC | 9.688 ms | 0 - 363 MB | NPU | [Nomic-Embed-Text.dlc](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.dlc) |
|
| 46 |
+
| Nomic-Embed-Text | float | SA7255P ADP | Qualcomm® SA7255P | TFLITE | 31.651 ms | 0 - 364 MB | NPU | [Nomic-Embed-Text.tflite](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.tflite) |
|
| 47 |
+
| Nomic-Embed-Text | float | SA7255P ADP | Qualcomm® SA7255P | QNN_DLC | 28.185 ms | 0 - 361 MB | NPU | [Nomic-Embed-Text.dlc](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.dlc) |
|
| 48 |
+
| Nomic-Embed-Text | float | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | TFLITE | 8.813 ms | 3 - 29 MB | NPU | [Nomic-Embed-Text.tflite](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.tflite) |
|
| 49 |
+
| Nomic-Embed-Text | float | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_DLC | 7.474 ms | 0 - 23 MB | NPU | [Nomic-Embed-Text.dlc](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.dlc) |
|
| 50 |
+
| Nomic-Embed-Text | float | SA8295P ADP | Qualcomm® SA8295P | TFLITE | 12.375 ms | 0 - 358 MB | NPU | [Nomic-Embed-Text.tflite](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.tflite) |
|
| 51 |
+
| Nomic-Embed-Text | float | SA8295P ADP | Qualcomm® SA8295P | QNN_DLC | 10.607 ms | 0 - 356 MB | NPU | [Nomic-Embed-Text.dlc](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.dlc) |
|
| 52 |
+
| Nomic-Embed-Text | float | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | TFLITE | 8.839 ms | 0 - 15 MB | NPU | [Nomic-Embed-Text.tflite](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.tflite) |
|
| 53 |
+
| Nomic-Embed-Text | float | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_DLC | 7.423 ms | 0 - 23 MB | NPU | [Nomic-Embed-Text.dlc](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.dlc) |
|
| 54 |
+
| Nomic-Embed-Text | float | SA8775P ADP | Qualcomm® SA8775P | TFLITE | 11.131 ms | 0 - 364 MB | NPU | [Nomic-Embed-Text.tflite](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.tflite) |
|
| 55 |
+
| Nomic-Embed-Text | float | SA8775P ADP | Qualcomm® SA8775P | QNN_DLC | 9.688 ms | 0 - 363 MB | NPU | [Nomic-Embed-Text.dlc](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.dlc) |
|
| 56 |
+
| Nomic-Embed-Text | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | TFLITE | 8.77 ms | 0 - 15 MB | NPU | [Nomic-Embed-Text.tflite](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.tflite) |
|
| 57 |
+
| Nomic-Embed-Text | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | QNN_DLC | 7.484 ms | 0 - 27 MB | NPU | [Nomic-Embed-Text.dlc](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.dlc) |
|
| 58 |
+
| Nomic-Embed-Text | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | ONNX | 8.07 ms | 0 - 25 MB | NPU | [Nomic-Embed-Text.onnx.zip](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.onnx.zip) |
|
| 59 |
+
| Nomic-Embed-Text | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | TFLITE | 6.405 ms | 0 - 370 MB | NPU | [Nomic-Embed-Text.tflite](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.tflite) |
|
| 60 |
+
| Nomic-Embed-Text | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_DLC | 5.308 ms | 0 - 372 MB | NPU | [Nomic-Embed-Text.dlc](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.dlc) |
|
| 61 |
+
| Nomic-Embed-Text | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | ONNX | 5.876 ms | 0 - 377 MB | NPU | [Nomic-Embed-Text.onnx.zip](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.onnx.zip) |
|
| 62 |
+
| Nomic-Embed-Text | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | TFLITE | 6.247 ms | 0 - 365 MB | NPU | [Nomic-Embed-Text.tflite](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.tflite) |
|
| 63 |
+
| Nomic-Embed-Text | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | QNN_DLC | 4.962 ms | 0 - 364 MB | NPU | [Nomic-Embed-Text.dlc](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.dlc) |
|
| 64 |
+
| Nomic-Embed-Text | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | ONNX | 5.442 ms | 0 - 330 MB | NPU | [Nomic-Embed-Text.onnx.zip](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.onnx.zip) |
|
| 65 |
+
| Nomic-Embed-Text | float | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_DLC | 7.997 ms | 1522 - 1522 MB | NPU | [Nomic-Embed-Text.dlc](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.dlc) |
|
| 66 |
+
| Nomic-Embed-Text | float | Snapdragon X Elite CRD | Snapdragon® X Elite | ONNX | 9.472 ms | 264 - 264 MB | NPU | [Nomic-Embed-Text.onnx.zip](https://huggingface.co/qualcomm/Nomic-Embed-Text/blob/main/Nomic-Embed-Text.onnx.zip) |
|
| 67 |
|
| 68 |
|
| 69 |
|
precompiled/qualcomm-snapdragon-x-elite/Nomic-Embed-Text.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:91a1f095ba8258bef0040fe16be2304728b268007e4a653160354edb0ca15c61
|
| 3 |
+
size 274829312
|
precompiled/qualcomm-snapdragon-x-elite/Nomic-Embed-Text.onnx.zip
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:48106dca5639aff0ba3d70ee07d41b6b415e7c65d12ea3269319039941ffba40
|
| 3 |
+
size 253746753
|
precompiled/qualcomm-snapdragon-x-elite/sdk_versions.yml
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
sdk_versions:
|
| 2 |
qnn_context_binary:
|
| 3 |
-
qairt: 2.
|
| 4 |
precompiled_qnn_onnx:
|
| 5 |
qairt: 2.33.2.250410134701_117956
|
|
|
|
| 1 |
sdk_versions:
|
| 2 |
qnn_context_binary:
|
| 3 |
+
qairt: 2.37.0.250724175447_124859
|
| 4 |
precompiled_qnn_onnx:
|
| 5 |
qairt: 2.33.2.250410134701_117956
|
sdk_versions.yml
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
sdk_versions:
|
| 2 |
tflite:
|
| 3 |
-
qairt: 2.
|
| 4 |
tflite: 2.17.0
|
| 5 |
qnn_dlc:
|
| 6 |
-
qairt: 2.
|
| 7 |
onnx:
|
| 8 |
-
qairt: 2.
|
| 9 |
onnx_runtime: 1.22.0
|
|
|
|
| 1 |
sdk_versions:
|
| 2 |
tflite:
|
| 3 |
+
qairt: 2.37.0.250724175447_124859
|
| 4 |
tflite: 2.17.0
|
| 5 |
qnn_dlc:
|
| 6 |
+
qairt: 2.37.0.250724175447_124859
|
| 7 |
onnx:
|
| 8 |
+
qairt: 2.33.2.250410134701_117956
|
| 9 |
onnx_runtime: 1.22.0
|