Upload 29 files
Browse files
Initialize the repo, and update the axmodel of AX650 and AX630C
- .gitattributes +6 -0
- ax620e/base/base-decoder-loop.axmodel +3 -0
- ax620e/base/base-decoder-main.axmodel +3 -0
- ax620e/base/base-encoder.axmodel +3 -0
- ax620e/base/base-positional_embedding.bin +3 -0
- ax620e/base/base-tokens.txt +0 -0
- ax620e/install/TSCharacters.ocd2 +0 -0
- ax620e/install/TSPhrases.ocd2 +0 -0
- ax620e/install/t2s.json +22 -0
- ax620e/install/whisper +0 -0
- ax650/install/TSCharacters.ocd2 +0 -0
- ax650/install/TSPhrases.ocd2 +0 -0
- ax650/install/t2s.json +22 -0
- ax650/install/whisper +0 -0
- ax650/small/small-decoder-loop.axmodel +3 -0
- ax650/small/small-decoder-main.axmodel +3 -0
- ax650/small/small-encoder.axmodel +3 -0
- ax650/small/small-positional_embedding.bin +3 -0
- ax650/small/small-tokens.txt +0 -0
- ax650/tiny/tiny-decoder-loop.axmodel.onnx +3 -0
- ax650/tiny/tiny-decoder-main.axmodel.onnx +3 -0
- ax650/tiny/tiny-encoder.axmodel.onnx +3 -0
- ax650/tiny/tiny-positional_embedding.bin +3 -0
- ax650/tiny/tiny-tokens.txt +0 -0
- axcl_aarch64/whisper +0 -0
- config_whisper_decoder_loop_u16.json +78 -0
- config_whisper_decoder_main_u16.json +54 -0
- config_whisper_encoder_u16.json +30 -0
- datasets.zip +3 -0
- demo.wav +0 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,9 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
ax620e/base/base-decoder-loop.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
ax620e/base/base-decoder-main.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
ax620e/base/base-encoder.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
ax650/small/small-decoder-loop.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
ax650/small/small-decoder-main.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
ax650/small/small-encoder.axmodel filter=lfs diff=lfs merge=lfs -text
|
ax620e/base/base-decoder-loop.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4133ed1d67dbf4906b8dc4e59a642b558ffc46e461c9f6688045babe5a3a60ca
|
| 3 |
+
size 130371061
|
ax620e/base/base-decoder-main.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2c5bdd733b666aaac06144f1f780dfcdb961e131d658e4a499e14a25dde42688
|
| 3 |
+
size 135674831
|
ax620e/base/base-encoder.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c7238ad68dd496ed3c54acc9312dec4e559a9640cb504aea33f12aae93077e94
|
| 3 |
+
size 56035119
|
ax620e/base/base-positional_embedding.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88fa1cdbf2b06f86b0ecb7be0fccfc39e906502986572b8cf5319c250e857169
|
| 3 |
+
size 917504
|
ax620e/base/base-tokens.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
ax620e/install/TSCharacters.ocd2
ADDED
|
Binary file (46.1 kB). View file
|
|
|
ax620e/install/TSPhrases.ocd2
ADDED
|
Binary file (9.78 kB). View file
|
|
|
ax620e/install/t2s.json
ADDED
|
@@ -0,0 +1,22 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"name": "Traditional Chinese to Simplified Chinese",
|
| 3 |
+
"segmentation": {
|
| 4 |
+
"type": "mmseg",
|
| 5 |
+
"dict": {
|
| 6 |
+
"type": "ocd2",
|
| 7 |
+
"file": "TSPhrases.ocd2"
|
| 8 |
+
}
|
| 9 |
+
},
|
| 10 |
+
"conversion_chain": [{
|
| 11 |
+
"dict": {
|
| 12 |
+
"type": "group",
|
| 13 |
+
"dicts": [{
|
| 14 |
+
"type": "ocd2",
|
| 15 |
+
"file": "TSPhrases.ocd2"
|
| 16 |
+
}, {
|
| 17 |
+
"type": "ocd2",
|
| 18 |
+
"file": "TSCharacters.ocd2"
|
| 19 |
+
}]
|
| 20 |
+
}
|
| 21 |
+
}]
|
| 22 |
+
}
|
ax620e/install/whisper
ADDED
|
Binary file (490 kB). View file
|
|
|
ax650/install/TSCharacters.ocd2
ADDED
|
Binary file (46.1 kB). View file
|
|
|
ax650/install/TSPhrases.ocd2
ADDED
|
Binary file (9.78 kB). View file
|
|
|
ax650/install/t2s.json
ADDED
|
@@ -0,0 +1,22 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"name": "Traditional Chinese to Simplified Chinese",
|
| 3 |
+
"segmentation": {
|
| 4 |
+
"type": "mmseg",
|
| 5 |
+
"dict": {
|
| 6 |
+
"type": "ocd2",
|
| 7 |
+
"file": "TSPhrases.ocd2"
|
| 8 |
+
}
|
| 9 |
+
},
|
| 10 |
+
"conversion_chain": [{
|
| 11 |
+
"dict": {
|
| 12 |
+
"type": "group",
|
| 13 |
+
"dicts": [{
|
| 14 |
+
"type": "ocd2",
|
| 15 |
+
"file": "TSPhrases.ocd2"
|
| 16 |
+
}, {
|
| 17 |
+
"type": "ocd2",
|
| 18 |
+
"file": "TSCharacters.ocd2"
|
| 19 |
+
}]
|
| 20 |
+
}
|
| 21 |
+
}]
|
| 22 |
+
}
|
ax650/install/whisper
ADDED
|
Binary file (486 kB). View file
|
|
|
ax650/small/small-decoder-loop.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b472a0f3539d17fece09e92bf6cd69ebf391928a6050896bbf86b558a25def22
|
| 3 |
+
size 269002567
|
ax650/small/small-decoder-main.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f3bfc577f60c35192d8ce8cc24f9ca4aa84af72756ba11af9d178d337cb7eb1c
|
| 3 |
+
size 285531695
|
ax650/small/small-encoder.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7b3bc8db9762f9b2dfe78bffbc8070fb877b2572c5288253573e49a8c7b37948
|
| 3 |
+
size 139705612
|
ax650/small/small-positional_embedding.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c10bc44f2bd94bdf1b7aa03581309fa536132b3fe79bfe22c9a6934a42cd8b58
|
| 3 |
+
size 1376256
|
ax650/small/small-tokens.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
ax650/tiny/tiny-decoder-loop.axmodel.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b600ff566563a68cd1b1902082b1587aa67dc127cd9ef13b1cdc42bfc257375b
|
| 3 |
+
size 128477481
|
ax650/tiny/tiny-decoder-main.axmodel.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:50beadff2619fe099821aa28351c1cf887b5b1c97a4e696541314d6d43131dc7
|
| 3 |
+
size 131255063
|
ax650/tiny/tiny-encoder.axmodel.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:627b1a55b5daa32db0079f8902d006e4d1c86d60f29c72d3a1914311c4b83f55
|
| 3 |
+
size 14422649
|
ax650/tiny/tiny-positional_embedding.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c13450ae630323a0bdd39b1226f92a7ac251131a909c7efdb7d2f5516736eb83
|
| 3 |
+
size 688128
|
ax650/tiny/tiny-tokens.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
axcl_aarch64/whisper
ADDED
|
Binary file (559 kB). View file
|
|
|
config_whisper_decoder_loop_u16.json
ADDED
|
@@ -0,0 +1,78 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"model_type": "ONNX",
|
| 3 |
+
"npu_mode": "NPU3",
|
| 4 |
+
"quant": {
|
| 5 |
+
"input_configs": [
|
| 6 |
+
{
|
| 7 |
+
"tensor_name": "tokens",
|
| 8 |
+
"calibration_dataset": "./calibrations_tiny/decoder_loop/tokens.tar.gz",
|
| 9 |
+
"calibration_size": -1,
|
| 10 |
+
"calibration_format": "Numpy"
|
| 11 |
+
},
|
| 12 |
+
{
|
| 13 |
+
"tensor_name": "n_layer_cross_k",
|
| 14 |
+
"calibration_dataset": "./calibrations_tiny/decoder_loop/n_layer_cross_k.tar.gz",
|
| 15 |
+
"calibration_size": -1,
|
| 16 |
+
"calibration_format": "Numpy"
|
| 17 |
+
},
|
| 18 |
+
{
|
| 19 |
+
"tensor_name": "in_n_layer_self_k_cache",
|
| 20 |
+
"calibration_dataset": "./calibrations_tiny/decoder_loop/n_layer_self_k_cache.tar.gz",
|
| 21 |
+
"calibration_size": -1,
|
| 22 |
+
"calibration_format": "Numpy"
|
| 23 |
+
},
|
| 24 |
+
{
|
| 25 |
+
"tensor_name": "in_n_layer_self_v_cache",
|
| 26 |
+
"calibration_dataset": "./calibrations_tiny/decoder_loop/n_layer_self_v_cache.tar.gz",
|
| 27 |
+
"calibration_size": -1,
|
| 28 |
+
"calibration_format": "Numpy"
|
| 29 |
+
},
|
| 30 |
+
{
|
| 31 |
+
"tensor_name": "n_layer_cross_v",
|
| 32 |
+
"calibration_dataset": "./calibrations_tiny/decoder_loop/n_layer_cross_v.tar.gz",
|
| 33 |
+
"calibration_size": -1,
|
| 34 |
+
"calibration_format": "Numpy"
|
| 35 |
+
},
|
| 36 |
+
{
|
| 37 |
+
"tensor_name": "positional_embedding",
|
| 38 |
+
"calibration_dataset": "./calibrations_tiny/decoder_loop/positional_embedding.tar.gz",
|
| 39 |
+
"calibration_size": -1,
|
| 40 |
+
"calibration_format": "Numpy"
|
| 41 |
+
},
|
| 42 |
+
{
|
| 43 |
+
"tensor_name": "mask",
|
| 44 |
+
"calibration_dataset": "./calibrations_tiny/decoder_loop/mask.tar.gz",
|
| 45 |
+
"calibration_size": -1,
|
| 46 |
+
"calibration_format": "Numpy"
|
| 47 |
+
}
|
| 48 |
+
],
|
| 49 |
+
"layer_configs": [
|
| 50 |
+
{
|
| 51 |
+
"start_tensor_names": ["DEFAULT"],
|
| 52 |
+
"end_tensor_names": ["DEFAULT"],
|
| 53 |
+
"data_type": "U16"
|
| 54 |
+
},
|
| 55 |
+
{
|
| 56 |
+
"op_types": ["Gather"],
|
| 57 |
+
"data_type": "FP32"
|
| 58 |
+
},
|
| 59 |
+
{
|
| 60 |
+
"layer_names": ["/Add_1", "/Add_5", "/Add_9", "/Add_13"],
|
| 61 |
+
"data_type": "FP32"
|
| 62 |
+
},
|
| 63 |
+
{
|
| 64 |
+
"layer_names": ["/Softmax", "/Softmax_2", "/Softmax_4", "/Softmax_6"],
|
| 65 |
+
"data_type": "FP32"
|
| 66 |
+
}
|
| 67 |
+
],
|
| 68 |
+
"calibration_method": "MinMax"
|
| 69 |
+
},
|
| 70 |
+
"input_processors": [
|
| 71 |
+
{
|
| 72 |
+
"tensor_name": "DEFAULT"
|
| 73 |
+
}
|
| 74 |
+
],
|
| 75 |
+
"compiler": {
|
| 76 |
+
"check": 2
|
| 77 |
+
}
|
| 78 |
+
}
|
config_whisper_decoder_main_u16.json
ADDED
|
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"model_type": "ONNX",
|
| 3 |
+
"npu_mode": "NPU3",
|
| 4 |
+
"quant": {
|
| 5 |
+
"input_configs": [
|
| 6 |
+
{
|
| 7 |
+
"tensor_name": "tokens",
|
| 8 |
+
"calibration_dataset": "./calibrations_tiny/decoder_main/tokens.tar.gz",
|
| 9 |
+
"calibration_size": -1,
|
| 10 |
+
"calibration_format": "Numpy"
|
| 11 |
+
},
|
| 12 |
+
{
|
| 13 |
+
"tensor_name": "n_layer_cross_k",
|
| 14 |
+
"calibration_dataset": "./calibrations_tiny/decoder_main/n_layer_cross_k.tar.gz",
|
| 15 |
+
"calibration_size": -1,
|
| 16 |
+
"calibration_format": "Numpy"
|
| 17 |
+
},
|
| 18 |
+
{
|
| 19 |
+
"tensor_name": "n_layer_cross_v",
|
| 20 |
+
"calibration_dataset": "./calibrations_tiny/decoder_main/n_layer_cross_v.tar.gz",
|
| 21 |
+
"calibration_size": -1,
|
| 22 |
+
"calibration_format": "Numpy"
|
| 23 |
+
}
|
| 24 |
+
],
|
| 25 |
+
"layer_configs": [
|
| 26 |
+
{
|
| 27 |
+
"start_tensor_names": ["DEFAULT"],
|
| 28 |
+
"end_tensor_names": ["DEFAULT"],
|
| 29 |
+
"data_type": "U16"
|
| 30 |
+
},
|
| 31 |
+
{
|
| 32 |
+
"op_types": ["Gather"],
|
| 33 |
+
"data_type": "FP32"
|
| 34 |
+
},
|
| 35 |
+
{
|
| 36 |
+
"layer_names": ["/Add_1", "/Add_5", "/Add_9", "/Add_13"],
|
| 37 |
+
"data_type": "FP32"
|
| 38 |
+
},
|
| 39 |
+
{
|
| 40 |
+
"layer_names": ["/Softmax", "/Softmax_2", "/Softmax_4", "/Softmax_6"],
|
| 41 |
+
"data_type": "FP32"
|
| 42 |
+
}
|
| 43 |
+
],
|
| 44 |
+
"calibration_method": "MinMax"
|
| 45 |
+
},
|
| 46 |
+
"input_processors": [
|
| 47 |
+
{
|
| 48 |
+
"tensor_name": "DEFAULT"
|
| 49 |
+
}
|
| 50 |
+
],
|
| 51 |
+
"compiler": {
|
| 52 |
+
"check": 2
|
| 53 |
+
}
|
| 54 |
+
}
|
config_whisper_encoder_u16.json
ADDED
|
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"model_type": "ONNX",
|
| 3 |
+
"npu_mode": "NPU3",
|
| 4 |
+
"quant": {
|
| 5 |
+
"input_configs": [
|
| 6 |
+
{
|
| 7 |
+
"tensor_name": "mel",
|
| 8 |
+
"calibration_dataset": "./calibrations_tiny/encoder/mel.tar.gz",
|
| 9 |
+
"calibration_size": -1,
|
| 10 |
+
"calibration_format": "Numpy"
|
| 11 |
+
}
|
| 12 |
+
],
|
| 13 |
+
"layer_configs": [
|
| 14 |
+
{
|
| 15 |
+
"start_tensor_names": ["DEFAULT"],
|
| 16 |
+
"end_tensor_names": ["DEFAULT"],
|
| 17 |
+
"data_type": "U16"
|
| 18 |
+
}
|
| 19 |
+
],
|
| 20 |
+
"calibration_method": "MinMax"
|
| 21 |
+
},
|
| 22 |
+
"input_processors": [
|
| 23 |
+
{
|
| 24 |
+
"tensor_name": "mel"
|
| 25 |
+
}
|
| 26 |
+
],
|
| 27 |
+
"compiler": {
|
| 28 |
+
"check": 3
|
| 29 |
+
}
|
| 30 |
+
}
|
datasets.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2bd7b4da356313a433cb119aa37e960f925b288d7133cfbd5106800fa28c6523
|
| 3 |
+
size 41523788
|
demo.wav
ADDED
|
Binary file (135 kB). View file
|
|
|