eacortes committed on
Commit
e9b0913
·
verified ·
1 Parent(s): 0e69c09

Upload folder using huggingface_hub

Browse files
Files changed (5) hide show
  1. .gitattributes +2 -0
  2. README.md +4 -2
  3. model_b1_s256.rknn +3 -0
  4. model_b4_s256.rknn +3 -0
  5. rknn.json +84 -0
.gitattributes CHANGED
@@ -39,3 +39,5 @@ rknn/model_o1.rknn filter=lfs diff=lfs merge=lfs -text
39
  rknn/model_o2.rknn filter=lfs diff=lfs merge=lfs -text
40
  rknn/model_o3.rknn filter=lfs diff=lfs merge=lfs -text
41
  rknn/model_w8a8.rknn filter=lfs diff=lfs merge=lfs -text
 
 
 
39
  rknn/model_o2.rknn filter=lfs diff=lfs merge=lfs -text
40
  rknn/model_o3.rknn filter=lfs diff=lfs merge=lfs -text
41
  rknn/model_w8a8.rknn filter=lfs diff=lfs merge=lfs -text
42
+ model_b1_s256.rknn filter=lfs diff=lfs merge=lfs -text
43
+ model_b4_s256.rknn filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -13,8 +13,8 @@ tags:
13
  - rk-transformers
14
  - rk3588
15
  pipeline_tag: sentence-similarity
16
- base_model: sentence-transformers/all-MiniLM-L6-v2
17
  model_name: all-MiniLM-L6-v2
 
18
  ---
19
  # all-MiniLM-L6-v2 (RKNN2)
20
 
@@ -34,6 +34,8 @@ model_name: all-MiniLM-L6-v2
34
  | Model File | Optimization Level | Quantization | File Size |
35
  | :--------- | :----------------- | :----------- | :-------- |
36
  | [model.rknn](./model.rknn) | 0 | float16 | 45.7 MB |
 
 
37
  | [model_b4_s512.rknn](./model_b4_s512.rknn) | 0 | float16 | 52.5 MB |
38
  | [rknn/model_o1.rknn](./rknn/model_o1.rknn) | 1 | float16 | 45.7 MB |
39
  | [rknn/model_o2.rknn](./rknn/model_o2.rknn) | 2 | float16 | 45.7 MB |
@@ -102,7 +104,7 @@ model = RKRTModelForFeatureExtraction.from_pretrained(
102
  inputs = tokenizer(
103
  ["Sample text for encoding"],
104
  padding="max_length",
105
- max_length=512,
106
  truncation=True,
107
  return_tensors="np"
108
  )
 
13
  - rk-transformers
14
  - rk3588
15
  pipeline_tag: sentence-similarity
 
16
  model_name: all-MiniLM-L6-v2
17
+ base_model: sentence-transformers/all-MiniLM-L6-v2
18
  ---
19
  # all-MiniLM-L6-v2 (RKNN2)
20
 
 
34
  | Model File | Optimization Level | Quantization | File Size |
35
  | :--------- | :----------------- | :----------- | :-------- |
36
  | [model.rknn](./model.rknn) | 0 | float16 | 45.7 MB |
37
+ | [model_b1_s256.rknn](./model_b1_s256.rknn) | 0 | float16 | 44.7 MB |
38
+ | [model_b4_s256.rknn](./model_b4_s256.rknn) | 0 | float16 | 48.9 MB |
39
  | [model_b4_s512.rknn](./model_b4_s512.rknn) | 0 | float16 | 52.5 MB |
40
  | [rknn/model_o1.rknn](./rknn/model_o1.rknn) | 1 | float16 | 45.7 MB |
41
  | [rknn/model_o2.rknn](./rknn/model_o2.rknn) | 2 | float16 | 45.7 MB |
 
104
  inputs = tokenizer(
105
  ["Sample text for encoding"],
106
  padding="max_length",
107
+ max_length=256,
108
  truncation=True,
109
  return_tensors="np"
110
  )
model_b1_s256.rknn ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14315427c644d669134f3620ba1efe97dc6972bb28c53340e7363bf2e08bfc6b
3
+ size 46920212
model_b4_s256.rknn ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4eae8ea4b3dd8bd2332da540b52a0f8707cf5f890fc31bd91d221ca1d85de64c
3
+ size 51320404
rknn.json CHANGED
@@ -254,5 +254,89 @@
254
  "sparse_infer": false,
255
  "model_pruning": false
256
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
257
  }
258
  }
 
254
  "sparse_infer": false,
255
  "model_pruning": false
256
  }
257
+ },
258
+ "model_b1_s256.rknn": {
259
+ "model_input_names": [
260
+ "input_ids",
261
+ "attention_mask"
262
+ ],
263
+ "batch_size": 1,
264
+ "max_seq_length": 256,
265
+ "float_dtype": "float16",
266
+ "target_platform": "rk3588",
267
+ "single_core_mode": false,
268
+ "mean_values": null,
269
+ "std_values": null,
270
+ "custom_string": null,
271
+ "inputs_yuv_fmt": null,
272
+ "dynamic_input": null,
273
+ "opset": 18,
274
+ "task": "auto",
275
+ "quantization": {
276
+ "do_quantization": false,
277
+ "dataset_name": null,
278
+ "dataset_subset": null,
279
+ "dataset_size": 128,
280
+ "dataset_split": null,
281
+ "dataset_columns": null,
282
+ "quantized_dtype": "w8a8",
283
+ "quantized_algorithm": "normal",
284
+ "quantized_method": "channel",
285
+ "quantized_hybrid_level": 0,
286
+ "quant_img_RGB2BGR": false,
287
+ "auto_hybrid_cos_thresh": 0.98,
288
+ "auto_hybrid_euc_thresh": null
289
+ },
290
+ "optimization": {
291
+ "optimization_level": 0,
292
+ "enable_flash_attention": true,
293
+ "remove_weight": false,
294
+ "compress_weight": false,
295
+ "remove_reshape": false,
296
+ "sparse_infer": false,
297
+ "model_pruning": false
298
+ }
299
+ },
300
+ "model_b4_s256.rknn": {
301
+ "model_input_names": [
302
+ "input_ids",
303
+ "attention_mask"
304
+ ],
305
+ "batch_size": 4,
306
+ "max_seq_length": 256,
307
+ "float_dtype": "float16",
308
+ "target_platform": "rk3588",
309
+ "single_core_mode": false,
310
+ "mean_values": null,
311
+ "std_values": null,
312
+ "custom_string": null,
313
+ "inputs_yuv_fmt": null,
314
+ "dynamic_input": null,
315
+ "opset": 18,
316
+ "task": "auto",
317
+ "quantization": {
318
+ "do_quantization": false,
319
+ "dataset_name": null,
320
+ "dataset_subset": null,
321
+ "dataset_size": 128,
322
+ "dataset_split": null,
323
+ "dataset_columns": null,
324
+ "quantized_dtype": "w8a8",
325
+ "quantized_algorithm": "normal",
326
+ "quantized_method": "channel",
327
+ "quantized_hybrid_level": 0,
328
+ "quant_img_RGB2BGR": false,
329
+ "auto_hybrid_cos_thresh": 0.98,
330
+ "auto_hybrid_euc_thresh": null
331
+ },
332
+ "optimization": {
333
+ "optimization_level": 0,
334
+ "enable_flash_attention": true,
335
+ "remove_weight": false,
336
+ "compress_weight": false,
337
+ "remove_reshape": false,
338
+ "sparse_infer": false,
339
+ "model_pruning": false
340
+ }
341
  }
342
  }