aoiandroid mefengl committed on
Commit
4c78a46
·
0 Parent(s):

Duplicate from mefengl/SenseVoiceSmall-coreml

Browse files

Co-authored-by: mefengl <mefengl@users.noreply.huggingface.co>

.gitattributes ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: coreml
3
+ pipeline_tag: automatic-speech-recognition
4
+ tags:
5
+ - coreml
6
+ - speech-recognition
7
+ - sensevoice
8
+ - asr
9
+ license: other
10
+ license_name: funasr-model-license
11
+ license_link: https://github.com/modelscope/FunASR/blob/main/MODEL_LICENSE
12
+ language:
13
+ - zh
14
+ - en
15
+ - ja
16
+ - ko
17
+ - yue
18
+ ---
19
+
20
+ # SenseVoiceSmall-coreml
21
+
22
+ [Hugging Face](https://huggingface.co/mefengl/SenseVoiceSmall-coreml) | [GitHub](https://github.com/mefengl/SenseVoiceSmall-coreml)
23
+
24
+ CoreML artifact for **SenseVoiceSmall**.
25
+
26
+ - Upstream model: https://huggingface.co/FunAudioLLM/SenseVoiceSmall
27
+ - Upstream code: https://github.com/FunAudioLLM/SenseVoice
28
+
29
+ ## Download
30
+
31
+ ```bash
32
+ uvx hf download mefengl/SenseVoiceSmall-coreml --local-dir . \
33
+ --include "coreml/SenseVoiceSmall.mlmodelc.zip" \
34
+ --include "config.json" \
35
+ --include "checksums.sha256"
36
+ ```
37
+
38
+ ## Verify
39
+
40
+ ```bash
41
+ make verify
42
+ ```
43
+
44
+ ## Optional: generate CoreML `.mlpackage`
45
+
46
+ Convert SenseVoiceSmall to a CoreML `.mlpackage` using the upstream model definition.
47
+
48
+ ```bash
49
+ # clones upstream code into ./.upstream/SenseVoice automatically
50
+ make convert DEPLOYMENT_TARGET=macOS15
51
+ # output: ./.coreml-build/SenseVoiceSmall.mlpackage
52
+ ```
53
+
54
+ ## Optional: rebuild `coreml/SenseVoiceSmall.mlmodelc.zip` from a `.mlpackage`
55
+
56
+ Requires macOS with Xcode installed.
57
+
58
+ ```bash
59
+ make build
60
+ make inspect
61
+ make verify
62
+ ```
63
+
64
+ ## Optional: compare (numeric)
65
+
66
+ Compare the CoreML output against the original PyTorch model.
67
+
68
+ ```bash
69
+ make compare \
70
+ MLPACKAGE=.coreml-build/SenseVoiceSmall.mlpackage
71
+ # SENSEVOICE_REPO defaults to ./.upstream/SenseVoice (auto-cloned by `make upstream`)
72
+ ```
checksums.sha256 ADDED
@@ -0,0 +1 @@
 
 
1
+ 880711fa03577363e6c1b1b6e9321f130ea1a53d5c065d92e1abd8a431bad6be coreml/SenseVoiceSmall.mlmodelc.zip
config.json ADDED
@@ -0,0 +1,82 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "SenseVoiceSmall-coreml",
3
+ "upstream": {
4
+ "model": "FunAudioLLM/SenseVoiceSmall",
5
+ "code": "https://github.com/FunAudioLLM/SenseVoice",
6
+ "model_revision": "3eb3b4eeffc2f2dde6051b853983753db33e35c3",
7
+ "code_commit": "b97857e5c807a466d0a062cf84dba9fe38a1d66a",
8
+ "assets": [
9
+ {
10
+ "name": "cmvn_am.mvn",
11
+ "url": "https://modelscope.cn/api/v1/models/iic/SenseVoiceSmall/repo?Revision=master&FilePath=am.mvn",
12
+ "sha256": "29b3c740a2c0cfc6b308126d31d7f265fa2be74f3bb095cd2f143ea970896ae5",
13
+ "bytes": 11203
14
+ },
15
+ {
16
+ "name": "spm",
17
+ "url": "https://modelscope.cn/api/v1/models/iic/SenseVoiceSmall/repo?Revision=master&FilePath=chn_jpn_yue_eng_ko_spectok.bpe.model",
18
+ "sha256": "aa87f86064c3730d799ddf7af3c04659151102cba548bce325cf06ba4da4e6a8",
19
+ "bytes": 377341
20
+ }
21
+ ]
22
+ },
23
+ "artifacts": {
24
+ "coreml_zip": "coreml/SenseVoiceSmall.mlmodelc.zip"
25
+ },
26
+ "coreml": {
27
+ "format": "mlmodelc",
28
+ "inputs": [
29
+ {
30
+ "name": "speech",
31
+ "dtype": "float32",
32
+ "shape": [
33
+ 1,
34
+ "T",
35
+ 560
36
+ ]
37
+ },
38
+ {
39
+ "name": "speech_lengths",
40
+ "dtype": "int32",
41
+ "shape": [
42
+ 1
43
+ ]
44
+ },
45
+ {
46
+ "name": "language",
47
+ "dtype": "int32",
48
+ "shape": [
49
+ 1
50
+ ]
51
+ },
52
+ {
53
+ "name": "textnorm",
54
+ "dtype": "int32",
55
+ "shape": [
56
+ 1
57
+ ]
58
+ }
59
+ ],
60
+ "outputs": [
61
+ {
62
+ "name": "ctc_logits"
63
+ },
64
+ {
65
+ "name": "encoder_out_lens"
66
+ }
67
+ ]
68
+ },
69
+ "decoding": {
70
+ "ctc_blank_id": 0,
71
+ "token_offset": 0
72
+ },
73
+ "notes": [
74
+ "Do not run a single forward pass on extremely long audio; use VAD/chunking."
75
+ ],
76
+ "build": {
77
+ "artifact": "coreml/SenseVoiceSmall.mlmodelc.zip",
78
+ "sha256": "880711fa03577363e6c1b1b6e9321f130ea1a53d5c065d92e1abd8a431bad6be",
79
+ "bytes": 432164139,
80
+ "xcodebuild_version": "Xcode 26.0\nBuild version 17A324"
81
+ }
82
+ }
coreml/SenseVoiceSmall.mlmodelc.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:880711fa03577363e6c1b1b6e9321f130ea1a53d5c065d92e1abd8a431bad6be
3
+ size 432164139