Jarbas committed on
Commit
82ea2f9
·
verified ·
1 Parent(s): d7e2496

Add CoreML export: stt-eu-conformer-ctc-large-coreml-4bit

Browse files
README.md ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - automatic-speech-recognition
5
+ - nemo
6
+ - coreml
7
+ - apple-silicon
8
+ - ovos
9
+ ---
10
+
11
+ # stt-eu-conformer-ctc-large-coreml-4bit
12
+
13
+ CoreML export of [HiTZ/stt_eu_conformer_ctc_large](https://huggingface.co/HiTZ/stt_eu_conformer_ctc_large) (Basque speech-to-text) for Apple Silicon, with weights compressed by 4-bit k-means palettization.
14
+
15
+ Exported with [ovos-stt-plugin-coreml](https://github.com/TigreGotico/ovos-stt-plugin-coreml).
16
+
17
+ ## Usage
18
+
19
+ ```python
20
+ from ovos_stt_plugin_coreml import CoremlSTT
21
+ stt = CoremlSTT(config={"repo_id": "OpenVoiceOS/stt-eu-conformer-ctc-large-coreml-4bit"})
22
+ ```
metadata.json ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_id": "HiTZ/stt_eu_conformer_ctc_large",
3
+ "model_type": "ctc",
4
+ "language": "eu",
5
+ "sample_rate": 16000,
6
+ "max_audio_seconds": 15.0,
7
+ "max_audio_samples": 240000,
8
+ "vocab_size": 256,
9
+ "blank_id": 256,
10
+ "checkpoint": {
11
+ "type": "pretrained",
12
+ "model_id": "HiTZ/stt_eu_conformer_ctc_large"
13
+ },
14
+ "coreml": {
15
+ "compute_precision": "FLOAT32",
16
+ "quantization": "4bit_palettize_kmeans"
17
+ },
18
+ "components": {
19
+ "mel_encoder": {
20
+ "path": "parakeet_mel_encoder.mlpackage",
21
+ "inputs": {
22
+ "audio_signal": [
23
+ 1,
24
+ 240000
25
+ ],
26
+ "audio_length": [
27
+ 1
28
+ ]
29
+ },
30
+ "outputs": {
31
+ "encoder": [
32
+ 1,
33
+ 512,
34
+ 376
35
+ ],
36
+ "encoder_length": [
37
+ 1
38
+ ]
39
+ }
40
+ },
41
+ "ctc_decoder": {
42
+ "path": "parakeet_ctc_decoder.mlpackage",
43
+ "inputs": {
44
+ "encoder": [
45
+ 1,
46
+ 512,
47
+ 376
48
+ ]
49
+ },
50
+ "outputs": {
51
+ "log_probs": [
52
+ 1,
53
+ 376,
54
+ 257
55
+ ]
56
+ }
57
+ }
58
+ }
59
+ }
parakeet_ctc_decoder.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c56389a10848483a7aa6a4398d95e29ba0c00792e41a6de1ba6136a43cc6cf4
3
+ size 2545
parakeet_ctc_decoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fba4385df7d1613f0c9fcecb76d8049f99fc3c0809d0650bb75c3a88f0b5c6d6
3
+ size 67200
parakeet_ctc_decoder.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "AF61B19F-CD39-4DFC-B508-8CECA0183E24": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Specification",
7
+ "name": "model.mlmodel",
8
+ "path": "com.apple.CoreML/model.mlmodel"
9
+ },
10
+ "FB429D97-5D3C-46A0-9AC2-1598F7CE31F4": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Weights",
13
+ "name": "weights",
14
+ "path": "com.apple.CoreML/weights"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "AF61B19F-CD39-4DFC-B508-8CECA0183E24"
18
+ }
parakeet_mel_encoder.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66ef9c76cb1aed10e8506cfd131880d7d7ee6ee4bfce7e17d64c3f7bc7b86f67
3
+ size 1347209
parakeet_mel_encoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83ea10030071ff896cd4fec712c69a8a0731dc2a48a4ab76599eda41513c2cd9
3
+ size 63054272
parakeet_mel_encoder.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "9F69AE1C-6350-404A-A8DE-A43884AB903C": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Specification",
7
+ "name": "model.mlmodel",
8
+ "path": "com.apple.CoreML/model.mlmodel"
9
+ },
10
+ "D6F710BF-375C-4563-98B3-CDFB161A7D24": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Weights",
13
+ "name": "weights",
14
+ "path": "com.apple.CoreML/weights"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "9F69AE1C-6350-404A-A8DE-A43884AB903C"
18
+ }
quantization_summary.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "parakeet_ctc_decoder": {
3
+ "original_mb": 0.5,
4
+ "4bit_mb": 0.1,
5
+ "compression": 7.54
6
+ },
7
+ "parakeet_mel_encoder": {
8
+ "original_mb": 474.4,
9
+ "4bit_mb": 61.4,
10
+ "compression": 7.72
11
+ }
12
+ }
vocab.json ADDED
@@ -0,0 +1,258 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ "<unk>",
3
+ "a",
4
+ "▁",
5
+ "i",
6
+ "n",
7
+ "r",
8
+ "ko",
9
+ "z",
10
+ "o",
11
+ "u",
12
+ "e",
13
+ "tu",
14
+ "s",
15
+ "l",
16
+ "k",
17
+ "ra",
18
+ "ak",
19
+ "te",
20
+ "▁a",
21
+ "la",
22
+ "ta",
23
+ "t",
24
+ "en",
25
+ "an",
26
+ "ri",
27
+ "▁da",
28
+ "▁eta",
29
+ "▁e",
30
+ "go",
31
+ "ka",
32
+ "re",
33
+ "da",
34
+ "▁ez",
35
+ "in",
36
+ "▁ba",
37
+ "▁i",
38
+ "tzen",
39
+ "gi",
40
+ "le",
41
+ "p",
42
+ "▁du",
43
+ "ki",
44
+ "di",
45
+ "du",
46
+ "▁ga",
47
+ "▁bat",
48
+ "ma",
49
+ "h",
50
+ "de",
51
+ "ek",
52
+ "gu",
53
+ "ro",
54
+ "tza",
55
+ "ur",
56
+ "▁o",
57
+ "to",
58
+ "▁ar",
59
+ "▁bi",
60
+ "▁es",
61
+ "aren",
62
+ "ba",
63
+ "ts",
64
+ "▁zen",
65
+ "▁izan",
66
+ "st",
67
+ "g",
68
+ "tik",
69
+ "ga",
70
+ "ren",
71
+ "era",
72
+ "▁di",
73
+ "ke",
74
+ "ti",
75
+ "▁ere",
76
+ "b",
77
+ "be",
78
+ "ten",
79
+ "▁f",
80
+ "▁er",
81
+ "▁ha",
82
+ "rra",
83
+ "iz",
84
+ "x",
85
+ "m",
86
+ "▁p",
87
+ "▁ho",
88
+ "f",
89
+ "ean",
90
+ "men",
91
+ "zu",
92
+ "etan",
93
+ "▁dira",
94
+ "▁u",
95
+ "▁be",
96
+ "▁z",
97
+ "lde",
98
+ "rri",
99
+ "▁ma",
100
+ "lo",
101
+ "zio",
102
+ "me",
103
+ "rik",
104
+ "▁egin",
105
+ "▁hori",
106
+ "▁sa",
107
+ "tzeko",
108
+ "▁zuen",
109
+ "▁de",
110
+ "lu",
111
+ "ru",
112
+ "tzi",
113
+ "▁har",
114
+ "▁ka",
115
+ "▁ber",
116
+ "pe",
117
+ "▁ditu",
118
+ "▁ze",
119
+ "▁al",
120
+ "si",
121
+ "pa",
122
+ "▁hau",
123
+ "▁jo",
124
+ "▁kon",
125
+ "do",
126
+ "▁bere",
127
+ "tan",
128
+ "▁zi",
129
+ "▁behar",
130
+ "ez",
131
+ "▁horre",
132
+ "▁dago",
133
+ "▁so",
134
+ "▁mi",
135
+ "bo",
136
+ "▁he",
137
+ "bide",
138
+ "▁dute",
139
+ "bi",
140
+ "▁ger",
141
+ "▁lan",
142
+ "▁se",
143
+ "tze",
144
+ "tzea",
145
+ "mo",
146
+ "▁na",
147
+ "ntz",
148
+ "▁pa",
149
+ "▁or",
150
+ "▁in",
151
+ "▁herri",
152
+ "▁oso",
153
+ "▁ni",
154
+ "▁mu",
155
+ "▁no",
156
+ "▁beste",
157
+ "▁den",
158
+ "▁po",
159
+ "▁urte",
160
+ "hi",
161
+ "bil",
162
+ "▁zu",
163
+ "keta",
164
+ "d",
165
+ "▁mo",
166
+ "▁zer",
167
+ "▁erre",
168
+ "▁baina",
169
+ "▁bo",
170
+ "▁nahi",
171
+ "▁ikas",
172
+ "aldi",
173
+ "etako",
174
+ "▁handi",
175
+ "▁ge",
176
+ "▁pro",
177
+ "tasun",
178
+ "ber",
179
+ "c",
180
+ "▁lo",
181
+ "▁ondo",
182
+ "▁dugu",
183
+ "garri",
184
+ "▁jar",
185
+ "itz",
186
+ "▁egun",
187
+ "▁ne",
188
+ "▁guzti",
189
+ "▁lehen",
190
+ "pen",
191
+ "▁ikus",
192
+ "▁egiten",
193
+ "▁esku",
194
+ "txe",
195
+ "▁gai",
196
+ "ekin",
197
+ "▁edo",
198
+ "▁tx",
199
+ "▁bizi",
200
+ "▁berri",
201
+ "▁ziren",
202
+ "▁zuten",
203
+ "▁zituen",
204
+ "▁li",
205
+ "▁aurre",
206
+ "tzaile",
207
+ "▁euskal",
208
+ "▁buru",
209
+ "arekin",
210
+ "▁hiru",
211
+ "▁erabil",
212
+ "▁lau",
213
+ "▁eman",
214
+ "▁gor",
215
+ "▁baino",
216
+ "▁su",
217
+ "▁hasi",
218
+ "txa",
219
+ "▁izen",
220
+ "▁euskara",
221
+ "▁hil",
222
+ "▁bu",
223
+ "▁dituzte",
224
+ "▁nagusi",
225
+ "ehun",
226
+ "▁mundu",
227
+ "▁talde",
228
+ "▁azken",
229
+ "▁hainbat",
230
+ "▁gutxi",
231
+ "▁orain",
232
+ "▁daude",
233
+ "garren",
234
+ "▁hitz",
235
+ "▁elkar",
236
+ "txo",
237
+ "▁batzuk",
238
+ "▁uste",
239
+ "▁hiri",
240
+ "entzia",
241
+ "▁gehien",
242
+ "v",
243
+ "▁gehiago",
244
+ "▁lagun",
245
+ "▁txiki",
246
+ "y",
247
+ "w",
248
+ "▁inguru",
249
+ "▁emakume",
250
+ "▁nuen",
251
+ "▁liburu",
252
+ "▁jende",
253
+ "▁hizkuntza",
254
+ "▁ahal",
255
+ "q",
256
+ "ñ",
257
+ "j"
258
+ ]