Upload folder using huggingface_hub
Browse files
- .gitattributes +2 -0
- README.md +4 -2
- model_b1_s256.rknn +3 -0
- model_b4_s256.rknn +3 -0
- rknn.json +84 -0
.gitattributes
CHANGED
|
@@ -39,3 +39,5 @@ rknn/model_o1.rknn filter=lfs diff=lfs merge=lfs -text
|
|
| 39 |
rknn/model_o2.rknn filter=lfs diff=lfs merge=lfs -text
|
| 40 |
rknn/model_o3.rknn filter=lfs diff=lfs merge=lfs -text
|
| 41 |
rknn/model_w8a8.rknn filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
| 39 |
rknn/model_o2.rknn filter=lfs diff=lfs merge=lfs -text
|
| 40 |
rknn/model_o3.rknn filter=lfs diff=lfs merge=lfs -text
|
| 41 |
rknn/model_w8a8.rknn filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
model_b1_s256.rknn filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
model_b4_s256.rknn filter=lfs diff=lfs merge=lfs -text
|
README.md
CHANGED
|
@@ -13,8 +13,8 @@ tags:
|
|
| 13 |
- rk-transformers
|
| 14 |
- rk3588
|
| 15 |
pipeline_tag: sentence-similarity
|
| 16 |
-
base_model: sentence-transformers/all-MiniLM-L6-v2
|
| 17 |
model_name: all-MiniLM-L6-v2
|
|
|
|
| 18 |
---
|
| 19 |
# all-MiniLM-L6-v2 (RKNN2)
|
| 20 |
|
|
@@ -34,6 +34,8 @@ model_name: all-MiniLM-L6-v2
|
|
| 34 |
| Model File | Optimization Level | Quantization | File Size |
|
| 35 |
| :--------- | :----------------- | :----------- | :-------- |
|
| 36 |
| [model.rknn](./model.rknn) | 0 | float16 | 45.7 MB |
|
|
|
|
|
|
|
| 37 |
| [model_b4_s512.rknn](./model_b4_s512.rknn) | 0 | float16 | 52.5 MB |
|
| 38 |
| [rknn/model_o1.rknn](./rknn/model_o1.rknn) | 1 | float16 | 45.7 MB |
|
| 39 |
| [rknn/model_o2.rknn](./rknn/model_o2.rknn) | 2 | float16 | 45.7 MB |
|
|
@@ -102,7 +104,7 @@ model = RKRTModelForFeatureExtraction.from_pretrained(
|
|
| 102 |
inputs = tokenizer(
|
| 103 |
["Sample text for encoding"],
|
| 104 |
padding="max_length",
|
| 105 |
-
max_length=
|
| 106 |
truncation=True,
|
| 107 |
return_tensors="np"
|
| 108 |
)
|
|
|
|
| 13 |
- rk-transformers
|
| 14 |
- rk3588
|
| 15 |
pipeline_tag: sentence-similarity
|
|
|
|
| 16 |
model_name: all-MiniLM-L6-v2
|
| 17 |
+
base_model: sentence-transformers/all-MiniLM-L6-v2
|
| 18 |
---
|
| 19 |
# all-MiniLM-L6-v2 (RKNN2)
|
| 20 |
|
|
|
|
| 34 |
| Model File | Optimization Level | Quantization | File Size |
|
| 35 |
| :--------- | :----------------- | :----------- | :-------- |
|
| 36 |
| [model.rknn](./model.rknn) | 0 | float16 | 45.7 MB |
|
| 37 |
+
| [model_b1_s256.rknn](./model_b1_s256.rknn) | 0 | float16 | 44.7 MB |
|
| 38 |
+
| [model_b4_s256.rknn](./model_b4_s256.rknn) | 0 | float16 | 48.9 MB |
|
| 39 |
| [model_b4_s512.rknn](./model_b4_s512.rknn) | 0 | float16 | 52.5 MB |
|
| 40 |
| [rknn/model_o1.rknn](./rknn/model_o1.rknn) | 1 | float16 | 45.7 MB |
|
| 41 |
| [rknn/model_o2.rknn](./rknn/model_o2.rknn) | 2 | float16 | 45.7 MB |
|
|
|
|
| 104 |
inputs = tokenizer(
|
| 105 |
["Sample text for encoding"],
|
| 106 |
padding="max_length",
|
| 107 |
+
max_length=256,
|
| 108 |
truncation=True,
|
| 109 |
return_tensors="np"
|
| 110 |
)
|
model_b1_s256.rknn
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14315427c644d669134f3620ba1efe97dc6972bb28c53340e7363bf2e08bfc6b
|
| 3 |
+
size 46920212
|
model_b4_s256.rknn
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4eae8ea4b3dd8bd2332da540b52a0f8707cf5f890fc31bd91d221ca1d85de64c
|
| 3 |
+
size 51320404
|
rknn.json
CHANGED
|
@@ -254,5 +254,89 @@
|
|
| 254 |
"sparse_infer": false,
|
| 255 |
"model_pruning": false
|
| 256 |
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 257 |
}
|
| 258 |
}
|
|
|
|
| 254 |
"sparse_infer": false,
|
| 255 |
"model_pruning": false
|
| 256 |
}
|
| 257 |
+
},
|
| 258 |
+
"model_b1_s256.rknn": {
|
| 259 |
+
"model_input_names": [
|
| 260 |
+
"input_ids",
|
| 261 |
+
"attention_mask"
|
| 262 |
+
],
|
| 263 |
+
"batch_size": 1,
|
| 264 |
+
"max_seq_length": 256,
|
| 265 |
+
"float_dtype": "float16",
|
| 266 |
+
"target_platform": "rk3588",
|
| 267 |
+
"single_core_mode": false,
|
| 268 |
+
"mean_values": null,
|
| 269 |
+
"std_values": null,
|
| 270 |
+
"custom_string": null,
|
| 271 |
+
"inputs_yuv_fmt": null,
|
| 272 |
+
"dynamic_input": null,
|
| 273 |
+
"opset": 18,
|
| 274 |
+
"task": "auto",
|
| 275 |
+
"quantization": {
|
| 276 |
+
"do_quantization": false,
|
| 277 |
+
"dataset_name": null,
|
| 278 |
+
"dataset_subset": null,
|
| 279 |
+
"dataset_size": 128,
|
| 280 |
+
"dataset_split": null,
|
| 281 |
+
"dataset_columns": null,
|
| 282 |
+
"quantized_dtype": "w8a8",
|
| 283 |
+
"quantized_algorithm": "normal",
|
| 284 |
+
"quantized_method": "channel",
|
| 285 |
+
"quantized_hybrid_level": 0,
|
| 286 |
+
"quant_img_RGB2BGR": false,
|
| 287 |
+
"auto_hybrid_cos_thresh": 0.98,
|
| 288 |
+
"auto_hybrid_euc_thresh": null
|
| 289 |
+
},
|
| 290 |
+
"optimization": {
|
| 291 |
+
"optimization_level": 0,
|
| 292 |
+
"enable_flash_attention": true,
|
| 293 |
+
"remove_weight": false,
|
| 294 |
+
"compress_weight": false,
|
| 295 |
+
"remove_reshape": false,
|
| 296 |
+
"sparse_infer": false,
|
| 297 |
+
"model_pruning": false
|
| 298 |
+
}
|
| 299 |
+
},
|
| 300 |
+
"model_b4_s256.rknn": {
|
| 301 |
+
"model_input_names": [
|
| 302 |
+
"input_ids",
|
| 303 |
+
"attention_mask"
|
| 304 |
+
],
|
| 305 |
+
"batch_size": 4,
|
| 306 |
+
"max_seq_length": 256,
|
| 307 |
+
"float_dtype": "float16",
|
| 308 |
+
"target_platform": "rk3588",
|
| 309 |
+
"single_core_mode": false,
|
| 310 |
+
"mean_values": null,
|
| 311 |
+
"std_values": null,
|
| 312 |
+
"custom_string": null,
|
| 313 |
+
"inputs_yuv_fmt": null,
|
| 314 |
+
"dynamic_input": null,
|
| 315 |
+
"opset": 18,
|
| 316 |
+
"task": "auto",
|
| 317 |
+
"quantization": {
|
| 318 |
+
"do_quantization": false,
|
| 319 |
+
"dataset_name": null,
|
| 320 |
+
"dataset_subset": null,
|
| 321 |
+
"dataset_size": 128,
|
| 322 |
+
"dataset_split": null,
|
| 323 |
+
"dataset_columns": null,
|
| 324 |
+
"quantized_dtype": "w8a8",
|
| 325 |
+
"quantized_algorithm": "normal",
|
| 326 |
+
"quantized_method": "channel",
|
| 327 |
+
"quantized_hybrid_level": 0,
|
| 328 |
+
"quant_img_RGB2BGR": false,
|
| 329 |
+
"auto_hybrid_cos_thresh": 0.98,
|
| 330 |
+
"auto_hybrid_euc_thresh": null
|
| 331 |
+
},
|
| 332 |
+
"optimization": {
|
| 333 |
+
"optimization_level": 0,
|
| 334 |
+
"enable_flash_attention": true,
|
| 335 |
+
"remove_weight": false,
|
| 336 |
+
"compress_weight": false,
|
| 337 |
+
"remove_reshape": false,
|
| 338 |
+
"sparse_infer": false,
|
| 339 |
+
"model_pruning": false
|
| 340 |
+
}
|
| 341 |
}
|
| 342 |
}
|