aufklarer commited on
Commit
4298b54
·
verified ·
1 Parent(s): d4055fc

6-model ANE architecture: TextProjector, CodeEmbedder, MultiCodeEmbedder, CodeDecoder, MultiCodeDecoder, SpeechDecoder + speaker embedding

Browse files
Files changed (41) hide show
  1. {CodePredictor.mlmodelc → CodeDecoder.mlmodelc}/analytics/coremldata.bin +1 -1
  2. {MimiDecoder.mlmodelc → CodeDecoder.mlmodelc}/coremldata.bin +2 -2
  3. {Talker.mlmodelc → CodeDecoder.mlmodelc}/metadata.json +28 -37
  4. CodeDecoder.mlmodelc/model.mil +0 -0
  5. {MimiDecoder.mlmodelc → CodeDecoder.mlmodelc}/weights/weight.bin +2 -2
  6. {Talker.mlmodelc → CodeEmbedder.mlmodelc}/analytics/coremldata.bin +1 -1
  7. CodeEmbedder.mlmodelc/coremldata.bin +3 -0
  8. CodeEmbedder.mlmodelc/metadata.json +67 -0
  9. CodeEmbedder.mlmodelc/model.mil +29 -0
  10. CodeEmbedder.mlmodelc/weights/weight.bin +3 -0
  11. CodePredictor.mlmodelc/metadata.json +0 -328
  12. CodePredictor.mlmodelc/model.mil +0 -0
  13. MimiDecoder.mlmodelc/model.mil +0 -0
  14. {MimiDecoder.mlmodelc → MultiCodeDecoder.mlmodelc}/analytics/coremldata.bin +1 -1
  15. MultiCodeDecoder.mlmodelc/coremldata.bin +3 -0
  16. MultiCodeDecoder.mlmodelc/metadata.json +162 -0
  17. MultiCodeDecoder.mlmodelc/model.mil +0 -0
  18. {Talker.mlmodelc → MultiCodeDecoder.mlmodelc}/weights/weight.bin +2 -2
  19. MultiCodeEmbedder.mlmodelc/analytics/coremldata.bin +3 -0
  20. MultiCodeEmbedder.mlmodelc/coremldata.bin +3 -0
  21. MultiCodeEmbedder.mlmodelc/metadata.json +67 -0
  22. MultiCodeEmbedder.mlmodelc/model.mil +29 -0
  23. MultiCodeEmbedder.mlmodelc/weights/weight.bin +3 -0
  24. SpeechDecoder.mlmodelc/analytics/coremldata.bin +3 -0
  25. SpeechDecoder.mlmodelc/coremldata.bin +3 -0
  26. {MimiDecoder.mlmodelc → SpeechDecoder.mlmodelc}/metadata.json +24 -27
  27. SpeechDecoder.mlmodelc/model.mil +0 -0
  28. {CodePredictor.mlmodelc → SpeechDecoder.mlmodelc}/weights/weight.bin +2 -2
  29. Talker.mlmodelc/coremldata.bin +0 -3
  30. Talker.mlmodelc/model.mil +0 -0
  31. TextProjector.mlmodelc/analytics/coremldata.bin +3 -0
  32. TextProjector.mlmodelc/coremldata.bin +3 -0
  33. TextProjector.mlmodelc/metadata.json +69 -0
  34. TextProjector.mlmodelc/model.mil +35 -0
  35. TextProjector.mlmodelc/weights/weight.bin +3 -0
  36. config.json +14 -10
  37. embeddings.safetensors +0 -3
  38. CodePredictor.mlmodelc/coremldata.bin → speaker_embedding.npy +2 -2
  39. tts_bos_embed.npy +3 -0
  40. tts_eos_embed.npy +3 -0
  41. tts_pad_embed.npy +3 -0
{CodePredictor.mlmodelc → CodeDecoder.mlmodelc}/analytics/coremldata.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:19727f665522e27ea6d1a551f82df935419b51e9b060af76ee1622837d1b80f1
3
  size 243
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f73b5cb1ea58da1354e9693a58de02d8313261cd34868b6b5bac0cf4830f091c
3
  size 243
{MimiDecoder.mlmodelc → CodeDecoder.mlmodelc}/coremldata.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:38a4d9c02d6c4d443b13335769dd6ffa1ad88ac64b7799e11098910b4652e734
3
- size 399
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae57abaa76c7566ec6ec30e316d1408fa75e1af208d630a552d0d66b4a260f68
3
+ size 642
{Talker.mlmodelc → CodeDecoder.mlmodelc}/metadata.json RENAMED
@@ -1,15 +1,15 @@
1
  [
2
  {
3
  "metadataOutputVersion" : "3.0",
4
- "storagePrecision" : "Mixed (Float16, Int32, Palettized (8 bits), UInt8)",
5
  "outputSchema" : [
6
  {
7
  "hasShapeFlexibility" : "0",
8
  "isOptional" : "0",
9
  "dataType" : "Float16",
10
- "formattedType" : "MultiArray (Float16 1 × 3072)",
11
  "shortDescription" : "",
12
- "shape" : "[1, 3072]",
13
  "name" : "logits",
14
  "type" : "MultiArray"
15
  },
@@ -27,20 +27,20 @@
27
  "hasShapeFlexibility" : "0",
28
  "isOptional" : "0",
29
  "dataType" : "Float16",
30
- "formattedType" : "MultiArray (Float16 1 × 28672 × 1 × 1)",
31
  "shortDescription" : "",
32
- "shape" : "[1, 28672, 1, 1]",
33
- "name" : "key_cache_updates",
34
  "type" : "MultiArray"
35
  },
36
  {
37
  "hasShapeFlexibility" : "0",
38
  "isOptional" : "0",
39
  "dataType" : "Float16",
40
- "formattedType" : "MultiArray (Float16 1 × 28672 × 1 × 1)",
41
  "shortDescription" : "",
42
- "shape" : "[1, 28672, 1, 1]",
43
- "name" : "value_cache_updates",
44
  "type" : "MultiArray"
45
  }
46
  ],
@@ -49,26 +49,27 @@
49
  ],
50
  "specificationVersion" : 9,
51
  "mlProgramOperationTypeHistogram" : {
52
- "Ios18.expandDims" : 6,
53
  "Ios18.softmax" : 28,
54
- "Ios18.mul" : 618,
55
- "Ios18.matmul" : 56,
 
56
  "Ios18.rsqrt" : 113,
57
  "Ios16.reduceMean" : 113,
58
- "Split" : 2,
59
  "Tile" : 56,
60
- "Ios18.add" : 309,
61
- "Ios16.reduceSum" : 56,
62
- "Ios18.reshape" : 336,
63
  "Ios18.constexprLutToDense" : 197,
64
- "Ios18.conv" : 197,
65
- "Ios18.concat" : 58,
66
- "Ios18.transpose" : 168,
67
  "Ios18.sub" : 1,
68
  "Ios18.pow" : 113,
 
69
  "Ios18.silu" : 28,
70
- "Ios18.squeeze" : 2,
71
- "Ios18.sliceByIndex" : 112
72
  },
73
  "computePrecision" : "Mixed (Float16, Float32, Int32)",
74
  "isUpdatable" : "0",
@@ -87,7 +88,7 @@
87
  "name" : "MLModelType_mlProgram"
88
  },
89
  "userDefinedMetadata" : {
90
- "com.github.apple.coremltools.conversion_date" : "2026-03-29",
91
  "com.github.apple.coremltools.source" : "torch==2.10.0",
92
  "com.github.apple.coremltools.version" : "9.0",
93
  "com.github.apple.coremltools.source_dialect" : "TorchScript"
@@ -106,21 +107,11 @@
106
  {
107
  "hasShapeFlexibility" : "0",
108
  "isOptional" : "0",
109
- "dataType" : "Float16",
110
- "formattedType" : "MultiArray (Float16 1 × 128 × 1)",
111
- "shortDescription" : "",
112
- "shape" : "[1, 128, 1]",
113
- "name" : "rope_cos",
114
- "type" : "MultiArray"
115
- },
116
- {
117
- "hasShapeFlexibility" : "0",
118
- "isOptional" : "0",
119
- "dataType" : "Float16",
120
- "formattedType" : "MultiArray (Float16 1 × 128 × 1)",
121
  "shortDescription" : "",
122
- "shape" : "[1, 128, 1]",
123
- "name" : "rope_sin",
124
  "type" : "MultiArray"
125
  },
126
  {
@@ -164,7 +155,7 @@
164
  "type" : "MultiArray"
165
  }
166
  ],
167
- "generatedClassName" : "Talker",
168
  "method" : "predict"
169
  }
170
  ]
 
1
  [
2
  {
3
  "metadataOutputVersion" : "3.0",
4
+ "storagePrecision" : "Mixed (Float16, Palettized (8 bits), UInt8)",
5
  "outputSchema" : [
6
  {
7
  "hasShapeFlexibility" : "0",
8
  "isOptional" : "0",
9
  "dataType" : "Float16",
10
+ "formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
11
  "shortDescription" : "",
12
+ "shape" : "[1, 1, 3072]",
13
  "name" : "logits",
14
  "type" : "MultiArray"
15
  },
 
27
  "hasShapeFlexibility" : "0",
28
  "isOptional" : "0",
29
  "dataType" : "Float16",
30
+ "formattedType" : "MultiArray (Float16 1 × 28672 × 1 × 256)",
31
  "shortDescription" : "",
32
+ "shape" : "[1, 28672, 1, 256]",
33
+ "name" : "new_key_cache",
34
  "type" : "MultiArray"
35
  },
36
  {
37
  "hasShapeFlexibility" : "0",
38
  "isOptional" : "0",
39
  "dataType" : "Float16",
40
+ "formattedType" : "MultiArray (Float16 1 × 28672 × 1 × 256)",
41
  "shortDescription" : "",
42
+ "shape" : "[1, 28672, 1, 256]",
43
+ "name" : "new_value_cache",
44
  "type" : "MultiArray"
45
  }
46
  ],
 
49
  ],
50
  "specificationVersion" : 9,
51
  "mlProgramOperationTypeHistogram" : {
52
+ "Ios18.expandDims" : 235,
53
  "Ios18.softmax" : 28,
54
+ "Ios18.cos" : 1,
55
+ "Ios18.mul" : 566,
56
+ "Ios18.matmul" : 57,
57
  "Ios18.rsqrt" : 113,
58
  "Ios16.reduceMean" : 113,
59
+ "Ios18.sin" : 1,
60
  "Tile" : 56,
61
+ "Ios18.add" : 311,
62
+ "Ios18.reshape" : 252,
 
63
  "Ios18.constexprLutToDense" : 197,
64
+ "Ios18.linear" : 197,
65
+ "Ios18.concat" : 59,
66
+ "Ios18.transpose" : 57,
67
  "Ios18.sub" : 1,
68
  "Ios18.pow" : 113,
69
+ "Ios18.cast" : 1,
70
  "Ios18.silu" : 28,
71
+ "Ios18.sliceByIndex" : 168,
72
+ "Ios18.squeeze" : 283
73
  },
74
  "computePrecision" : "Mixed (Float16, Float32, Int32)",
75
  "isUpdatable" : "0",
 
88
  "name" : "MLModelType_mlProgram"
89
  },
90
  "userDefinedMetadata" : {
91
+ "com.github.apple.coremltools.conversion_date" : "2026-03-30",
92
  "com.github.apple.coremltools.source" : "torch==2.10.0",
93
  "com.github.apple.coremltools.version" : "9.0",
94
  "com.github.apple.coremltools.source_dialect" : "TorchScript"
 
107
  {
108
  "hasShapeFlexibility" : "0",
109
  "isOptional" : "0",
110
+ "dataType" : "Int32",
111
+ "formattedType" : "MultiArray (Int32 1)",
 
 
 
 
 
 
 
 
 
 
112
  "shortDescription" : "",
113
+ "shape" : "[1]",
114
+ "name" : "cache_length",
115
  "type" : "MultiArray"
116
  },
117
  {
 
155
  "type" : "MultiArray"
156
  }
157
  ],
158
+ "generatedClassName" : "CodeDecoder",
159
  "method" : "predict"
160
  }
161
  ]
CodeDecoder.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
{MimiDecoder.mlmodelc → CodeDecoder.mlmodelc}/weights/weight.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:202b1d7b254ee9496615d236ef280d4dae2966ad54d2a13fdebbe2c4c684b958
3
- size 228181632
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65e3442b2ae6df9cc1d3942018bdd6622d174798b265355bc8003226a15068b4
3
+ size 443824768
{Talker.mlmodelc → CodeEmbedder.mlmodelc}/analytics/coremldata.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ff24977af0106176ba5e5526c8b1a451d42597675c7e5b3c50f303c9913db6bd
3
  size 243
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:602128d98154e1cab615ea7fe218dd91acd52338868d29fe4c1140535e22b851
3
  size 243
CodeEmbedder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b27307e3f1f9f5ef310e6fc7ee27ec3d69428c438b77720e86b5a1cb5bfa9919
3
+ size 380
CodeEmbedder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "metadataOutputVersion" : "3.0",
4
+ "storagePrecision" : "Float16",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float16",
10
+ "formattedType" : "MultiArray (Float16 1024 × 1 × 1)",
11
+ "shortDescription" : "",
12
+ "shape" : "[1024, 1, 1]",
13
+ "name" : "input_embeds",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "modelParameters" : [
18
+
19
+ ],
20
+ "specificationVersion" : 9,
21
+ "mlProgramOperationTypeHistogram" : {
22
+ "Select" : 1,
23
+ "Ios18.squeeze" : 2,
24
+ "Ios18.gather" : 1,
25
+ "Ios18.expandDims" : 2,
26
+ "Ios18.cast" : 3,
27
+ "Ios18.greaterEqual" : 1,
28
+ "Ios18.add" : 1
29
+ },
30
+ "computePrecision" : "Mixed (Float16, Int16, Int32)",
31
+ "isUpdatable" : "0",
32
+ "stateSchema" : [
33
+
34
+ ],
35
+ "availability" : {
36
+ "macOS" : "15.0",
37
+ "tvOS" : "18.0",
38
+ "visionOS" : "2.0",
39
+ "watchOS" : "11.0",
40
+ "iOS" : "18.0",
41
+ "macCatalyst" : "18.0"
42
+ },
43
+ "modelType" : {
44
+ "name" : "MLModelType_mlProgram"
45
+ },
46
+ "userDefinedMetadata" : {
47
+ "com.github.apple.coremltools.conversion_date" : "2026-03-30",
48
+ "com.github.apple.coremltools.source" : "torch==2.10.0",
49
+ "com.github.apple.coremltools.version" : "9.0",
50
+ "com.github.apple.coremltools.source_dialect" : "TorchScript"
51
+ },
52
+ "inputSchema" : [
53
+ {
54
+ "hasShapeFlexibility" : "0",
55
+ "isOptional" : "0",
56
+ "dataType" : "Int32",
57
+ "formattedType" : "MultiArray (Int32 1)",
58
+ "shortDescription" : "",
59
+ "shape" : "[1]",
60
+ "name" : "input_ids",
61
+ "type" : "MultiArray"
62
+ }
63
+ ],
64
+ "generatedClassName" : "CodeEmbedder",
65
+ "method" : "predict"
66
+ }
67
+ ]
CodeEmbedder.mlmodelc/model.mil ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ program(1.3)
2
+ [buildInfo = dict<string, string>({{"coremlc-component-MIL", "3510.2.1"}, {"coremlc-version", "3500.32.1"}, {"coremltools-component-torch", "2.10.0"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "9.0"}})]
3
+ {
4
+ func main<ios18>(tensor<int32, [1]> input_ids) {
5
+ int32 emb_batch_dims_0 = const()[name = string("emb_batch_dims_0"), val = int32(0)];
6
+ bool emb_validate_indices_0 = const()[name = string("emb_validate_indices_0"), val = bool(false)];
7
+ tensor<fp16, [3072, 1024]> codec_embedding_weight_to_fp16 = const()[name = string("codec_embedding_weight_to_fp16"), val = tensor<fp16, [3072, 1024]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64)))];
8
+ string input_ids_to_int16_dtype_0 = const()[name = string("input_ids_to_int16_dtype_0"), val = string("int16")];
9
+ string cast_2_dtype_0 = const()[name = string("cast_2_dtype_0"), val = string("int32")];
10
+ int32 greater_equal_0_y_0 = const()[name = string("greater_equal_0_y_0"), val = int32(0)];
11
+ tensor<int16, [1]> input_ids_to_int16 = cast(dtype = input_ids_to_int16_dtype_0, x = input_ids)[name = string("cast_5")];
12
+ tensor<int32, [1]> cast_2 = cast(dtype = cast_2_dtype_0, x = input_ids_to_int16)[name = string("cast_4")];
13
+ tensor<bool, [1]> greater_equal_0 = greater_equal(x = cast_2, y = greater_equal_0_y_0)[name = string("greater_equal_0")];
14
+ int32 slice_by_index_0 = const()[name = string("slice_by_index_0"), val = int32(3072)];
15
+ tensor<int32, [1]> add_0 = add(x = cast_2, y = slice_by_index_0)[name = string("add_0")];
16
+ tensor<int32, [1]> select_0 = select(a = cast_2, b = add_0, cond = greater_equal_0)[name = string("select_0")];
17
+ int32 emb_cast_fp16_cast_uint16_axis_0 = const()[name = string("emb_cast_fp16_cast_uint16_axis_0"), val = int32(0)];
18
+ string select_0_to_int16_dtype_0 = const()[name = string("select_0_to_int16_dtype_0"), val = string("int16")];
19
+ tensor<int16, [1]> select_0_to_int16 = cast(dtype = select_0_to_int16_dtype_0, x = select_0)[name = string("cast_3")];
20
+ tensor<fp16, [1, 1024]> emb_cast_fp16_cast_uint16_cast_uint16 = gather(axis = emb_cast_fp16_cast_uint16_axis_0, batch_dims = emb_batch_dims_0, indices = select_0_to_int16, validate_indices = emb_validate_indices_0, x = codec_embedding_weight_to_fp16)[name = string("emb_cast_fp16_cast_uint16_cast_uint16")];
21
+ tensor<int32, [1]> var_8_axes_0 = const()[name = string("op_8_axes_0"), val = tensor<int32, [1]>([0])];
22
+ tensor<fp16, [1024]> var_8_cast_fp16 = squeeze(axes = var_8_axes_0, x = emb_cast_fp16_cast_uint16_cast_uint16)[name = string("op_8_cast_fp16")];
23
+ tensor<fp16, [1024]> var_10_cast_fp16 = squeeze(x = var_8_cast_fp16)[name = string("op_10_cast_fp16")];
24
+ tensor<int32, [1]> var_12_axes_0 = const()[name = string("op_12_axes_0"), val = tensor<int32, [1]>([-1])];
25
+ tensor<fp16, [1024, 1]> var_12_cast_fp16 = expand_dims(axes = var_12_axes_0, x = var_10_cast_fp16)[name = string("op_12_cast_fp16")];
26
+ tensor<int32, [1]> var_14_axes_0 = const()[name = string("op_14_axes_0"), val = tensor<int32, [1]>([-1])];
27
+ tensor<fp16, [1024, 1, 1]> input_embeds = expand_dims(axes = var_14_axes_0, x = var_12_cast_fp16)[name = string("op_14_cast_fp16")];
28
+ } -> (input_embeds);
29
+ }
CodeEmbedder.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc523d30a88406fc4988b3e523cddba01b004a688071591be1db81e3abe0830b
3
+ size 6291584
CodePredictor.mlmodelc/metadata.json DELETED
@@ -1,328 +0,0 @@
1
- [
2
- {
3
- "metadataOutputVersion" : "3.0",
4
- "storagePrecision" : "Float32",
5
- "outputSchema" : [
6
- {
7
- "hasShapeFlexibility" : "0",
8
- "isOptional" : "0",
9
- "dataType" : "Float32",
10
- "formattedType" : "MultiArray (Float32 1 × 1 × 1024)",
11
- "shortDescription" : "",
12
- "shape" : "[1, 1, 1024]",
13
- "name" : "hidden_states",
14
- "type" : "MultiArray"
15
- },
16
- {
17
- "hasShapeFlexibility" : "0",
18
- "isOptional" : "0",
19
- "dataType" : "Float32",
20
- "formattedType" : "MultiArray (Float32)",
21
- "shortDescription" : "",
22
- "shape" : "[]",
23
- "name" : "layer_0_key_cache_out",
24
- "type" : "MultiArray"
25
- },
26
- {
27
- "hasShapeFlexibility" : "0",
28
- "isOptional" : "0",
29
- "dataType" : "Float32",
30
- "formattedType" : "MultiArray (Float32)",
31
- "shortDescription" : "",
32
- "shape" : "[]",
33
- "name" : "layer_0_value_cache_out",
34
- "type" : "MultiArray"
35
- },
36
- {
37
- "hasShapeFlexibility" : "0",
38
- "isOptional" : "0",
39
- "dataType" : "Float32",
40
- "formattedType" : "MultiArray (Float32)",
41
- "shortDescription" : "",
42
- "shape" : "[]",
43
- "name" : "layer_1_key_cache_out",
44
- "type" : "MultiArray"
45
- },
46
- {
47
- "hasShapeFlexibility" : "0",
48
- "isOptional" : "0",
49
- "dataType" : "Float32",
50
- "formattedType" : "MultiArray (Float32)",
51
- "shortDescription" : "",
52
- "shape" : "[]",
53
- "name" : "layer_1_value_cache_out",
54
- "type" : "MultiArray"
55
- },
56
- {
57
- "hasShapeFlexibility" : "0",
58
- "isOptional" : "0",
59
- "dataType" : "Float32",
60
- "formattedType" : "MultiArray (Float32)",
61
- "shortDescription" : "",
62
- "shape" : "[]",
63
- "name" : "layer_2_key_cache_out",
64
- "type" : "MultiArray"
65
- },
66
- {
67
- "hasShapeFlexibility" : "0",
68
- "isOptional" : "0",
69
- "dataType" : "Float32",
70
- "formattedType" : "MultiArray (Float32)",
71
- "shortDescription" : "",
72
- "shape" : "[]",
73
- "name" : "layer_2_value_cache_out",
74
- "type" : "MultiArray"
75
- },
76
- {
77
- "hasShapeFlexibility" : "0",
78
- "isOptional" : "0",
79
- "dataType" : "Float32",
80
- "formattedType" : "MultiArray (Float32)",
81
- "shortDescription" : "",
82
- "shape" : "[]",
83
- "name" : "layer_3_key_cache_out",
84
- "type" : "MultiArray"
85
- },
86
- {
87
- "hasShapeFlexibility" : "0",
88
- "isOptional" : "0",
89
- "dataType" : "Float32",
90
- "formattedType" : "MultiArray (Float32)",
91
- "shortDescription" : "",
92
- "shape" : "[]",
93
- "name" : "layer_3_value_cache_out",
94
- "type" : "MultiArray"
95
- },
96
- {
97
- "hasShapeFlexibility" : "0",
98
- "isOptional" : "0",
99
- "dataType" : "Float32",
100
- "formattedType" : "MultiArray (Float32)",
101
- "shortDescription" : "",
102
- "shape" : "[]",
103
- "name" : "layer_4_key_cache_out",
104
- "type" : "MultiArray"
105
- },
106
- {
107
- "hasShapeFlexibility" : "0",
108
- "isOptional" : "0",
109
- "dataType" : "Float32",
110
- "formattedType" : "MultiArray (Float32)",
111
- "shortDescription" : "",
112
- "shape" : "[]",
113
- "name" : "layer_4_value_cache_out",
114
- "type" : "MultiArray"
115
- }
116
- ],
117
- "modelParameters" : [
118
-
119
- ],
120
- "specificationVersion" : 9,
121
- "mlProgramOperationTypeHistogram" : {
122
- "Ios18.expandDims" : 3,
123
- "Ios18.softmax" : 5,
124
- "Ios18.cos" : 1,
125
- "Ios18.mul" : 93,
126
- "Ios18.matmul" : 10,
127
- "Ios18.rsqrt" : 21,
128
- "Identity" : 1,
129
- "Ios16.reduceMean" : 21,
130
- "Ios18.sin" : 1,
131
- "Tile" : 10,
132
- "Ios18.gather" : 5,
133
- "Ios18.add" : 46,
134
- "Ios18.reshape" : 40,
135
- "Shape" : 5,
136
- "Ios18.linear" : 35,
137
- "Ios18.concat" : 25,
138
- "Ios18.cast" : 1,
139
- "Ios18.sub" : 10,
140
- "Ios18.pow" : 21,
141
- "Ios18.transpose" : 50,
142
- "Ios18.silu" : 5,
143
- "Ios18.sliceByIndex" : 21
144
- },
145
- "computePrecision" : "Mixed (Float32, Int32)",
146
- "isUpdatable" : "0",
147
- "stateSchema" : [
148
-
149
- ],
150
- "availability" : {
151
- "macOS" : "15.0",
152
- "tvOS" : "18.0",
153
- "visionOS" : "2.0",
154
- "watchOS" : "11.0",
155
- "iOS" : "18.0",
156
- "macCatalyst" : "18.0"
157
- },
158
- "modelType" : {
159
- "name" : "MLModelType_mlProgram"
160
- },
161
- "userDefinedMetadata" : {
162
- "com.github.apple.coremltools.conversion_date" : "2026-03-29",
163
- "com.github.apple.coremltools.source" : "torch==2.10.0",
164
- "com.github.apple.coremltools.version" : "9.0",
165
- "com.github.apple.coremltools.source_dialect" : "TorchScript"
166
- },
167
- "inputSchema" : [
168
- {
169
- "dataType" : "Float32",
170
- "hasShapeFlexibility" : "1",
171
- "isOptional" : "0",
172
- "shapeFlexibility" : "1 × 1...20 × 1024",
173
- "shapeRange" : "[[1, 1], [1, 20], [1024, 1024]]",
174
- "formattedType" : "MultiArray (Float32 1 × 1 × 1024)",
175
- "type" : "MultiArray",
176
- "shape" : "[1, 1, 1024]",
177
- "name" : "input_embeds",
178
- "shortDescription" : ""
179
- },
180
- {
181
- "dataType" : "Int32",
182
- "hasShapeFlexibility" : "1",
183
- "isOptional" : "0",
184
- "shapeFlexibility" : "1 × 1...20",
185
- "shapeRange" : "[[1, 1], [1, 20]]",
186
- "formattedType" : "MultiArray (Int32 1 × 1)",
187
- "type" : "MultiArray",
188
- "shape" : "[1, 1]",
189
- "name" : "position_ids",
190
- "shortDescription" : ""
191
- },
192
- {
193
- "dataType" : "Float32",
194
- "hasShapeFlexibility" : "1",
195
- "isOptional" : "0",
196
- "shapeFlexibility" : "1 × 1 × 1...20 × 1...21",
197
- "shapeRange" : "[[1, 1], [1, 1], [1, 20], [1, 21]]",
198
- "formattedType" : "MultiArray (Float32 1 × 1 × 1 × 1)",
199
- "type" : "MultiArray",
200
- "shape" : "[1, 1, 1, 1]",
201
- "name" : "causal_mask",
202
- "shortDescription" : ""
203
- },
204
- {
205
- "dataType" : "Float32",
206
- "hasShapeFlexibility" : "1",
207
- "isOptional" : "0",
208
- "shapeFlexibility" : "1 × 8 × 1...20 × 128",
209
- "shapeRange" : "[[1, 1], [8, 8], [1, 20], [128, 128]]",
210
- "formattedType" : "MultiArray (Float32 1 × 8 × 1 × 128)",
211
- "type" : "MultiArray",
212
- "shape" : "[1, 8, 1, 128]",
213
- "name" : "layer_0_key_cache",
214
- "shortDescription" : ""
215
- },
216
- {
217
- "dataType" : "Float32",
218
- "hasShapeFlexibility" : "1",
219
- "isOptional" : "0",
220
- "shapeFlexibility" : "1 × 8 × 1...20 × 128",
221
- "shapeRange" : "[[1, 1], [8, 8], [1, 20], [128, 128]]",
222
- "formattedType" : "MultiArray (Float32 1 × 8 × 1 × 128)",
223
- "type" : "MultiArray",
224
- "shape" : "[1, 8, 1, 128]",
225
- "name" : "layer_0_value_cache",
226
- "shortDescription" : ""
227
- },
228
- {
229
- "dataType" : "Float32",
230
- "hasShapeFlexibility" : "1",
231
- "isOptional" : "0",
232
- "shapeFlexibility" : "1 × 8 × 1...20 × 128",
233
- "shapeRange" : "[[1, 1], [8, 8], [1, 20], [128, 128]]",
234
- "formattedType" : "MultiArray (Float32 1 × 8 × 1 × 128)",
235
- "type" : "MultiArray",
236
- "shape" : "[1, 8, 1, 128]",
237
- "name" : "layer_1_key_cache",
238
- "shortDescription" : ""
239
- },
240
- {
241
- "dataType" : "Float32",
242
- "hasShapeFlexibility" : "1",
243
- "isOptional" : "0",
244
- "shapeFlexibility" : "1 × 8 × 1...20 × 128",
245
- "shapeRange" : "[[1, 1], [8, 8], [1, 20], [128, 128]]",
246
- "formattedType" : "MultiArray (Float32 1 × 8 × 1 × 128)",
247
- "type" : "MultiArray",
248
- "shape" : "[1, 8, 1, 128]",
249
- "name" : "layer_1_value_cache",
250
- "shortDescription" : ""
251
- },
252
- {
253
- "dataType" : "Float32",
254
- "hasShapeFlexibility" : "1",
255
- "isOptional" : "0",
256
- "shapeFlexibility" : "1 × 8 × 1...20 × 128",
257
- "shapeRange" : "[[1, 1], [8, 8], [1, 20], [128, 128]]",
258
- "formattedType" : "MultiArray (Float32 1 × 8 × 1 × 128)",
259
- "type" : "MultiArray",
260
- "shape" : "[1, 8, 1, 128]",
261
- "name" : "layer_2_key_cache",
262
- "shortDescription" : ""
263
- },
264
- {
265
- "dataType" : "Float32",
266
- "hasShapeFlexibility" : "1",
267
- "isOptional" : "0",
268
- "shapeFlexibility" : "1 × 8 × 1...20 × 128",
269
- "shapeRange" : "[[1, 1], [8, 8], [1, 20], [128, 128]]",
270
- "formattedType" : "MultiArray (Float32 1 × 8 × 1 × 128)",
271
- "type" : "MultiArray",
272
- "shape" : "[1, 8, 1, 128]",
273
- "name" : "layer_2_value_cache",
274
- "shortDescription" : ""
275
- },
276
- {
277
- "dataType" : "Float32",
278
- "hasShapeFlexibility" : "1",
279
- "isOptional" : "0",
280
- "shapeFlexibility" : "1 × 8 × 1...20 × 128",
281
- "shapeRange" : "[[1, 1], [8, 8], [1, 20], [128, 128]]",
282
- "formattedType" : "MultiArray (Float32 1 × 8 × 1 × 128)",
283
- "type" : "MultiArray",
284
- "shape" : "[1, 8, 1, 128]",
285
- "name" : "layer_3_key_cache",
286
- "shortDescription" : ""
287
- },
288
- {
289
- "dataType" : "Float32",
290
- "hasShapeFlexibility" : "1",
291
- "isOptional" : "0",
292
- "shapeFlexibility" : "1 × 8 × 1...20 × 128",
293
- "shapeRange" : "[[1, 1], [8, 8], [1, 20], [128, 128]]",
294
- "formattedType" : "MultiArray (Float32 1 × 8 × 1 × 128)",
295
- "type" : "MultiArray",
296
- "shape" : "[1, 8, 1, 128]",
297
- "name" : "layer_3_value_cache",
298
- "shortDescription" : ""
299
- },
300
- {
301
- "dataType" : "Float32",
302
- "hasShapeFlexibility" : "1",
303
- "isOptional" : "0",
304
- "shapeFlexibility" : "1 × 8 × 1...20 × 128",
305
- "shapeRange" : "[[1, 1], [8, 8], [1, 20], [128, 128]]",
306
- "formattedType" : "MultiArray (Float32 1 × 8 × 1 × 128)",
307
- "type" : "MultiArray",
308
- "shape" : "[1, 8, 1, 128]",
309
- "name" : "layer_4_key_cache",
310
- "shortDescription" : ""
311
- },
312
- {
313
- "dataType" : "Float32",
314
- "hasShapeFlexibility" : "1",
315
- "isOptional" : "0",
316
- "shapeFlexibility" : "1 × 8 × 1...20 × 128",
317
- "shapeRange" : "[[1, 1], [8, 8], [1, 20], [128, 128]]",
318
- "formattedType" : "MultiArray (Float32 1 × 8 × 1 × 128)",
319
- "type" : "MultiArray",
320
- "shape" : "[1, 8, 1, 128]",
321
- "name" : "layer_4_value_cache",
322
- "shortDescription" : ""
323
- }
324
- ],
325
- "generatedClassName" : "CodePredictor",
326
- "method" : "predict"
327
- }
328
- ]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
CodePredictor.mlmodelc/model.mil DELETED
The diff for this file is too large to render. See raw diff
 
MimiDecoder.mlmodelc/model.mil DELETED
The diff for this file is too large to render. See raw diff
 
{MimiDecoder.mlmodelc → MultiCodeDecoder.mlmodelc}/analytics/coremldata.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a4f8fad96e23cd81374cff387bd5a1860e54eaa2bc9df0f41238e3a67c92ea2
3
  size 243
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e732fb4ad346cd6a1db697a4d94a0441850902701e0767a7cdaebaa9de1abc88
3
  size 243
MultiCodeDecoder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d491845bb47ba5f76ee40491f3c1824d4a1f30ec2675daa19d64b97a59c65fe7
3
+ size 636
MultiCodeDecoder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,162 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "metadataOutputVersion" : "3.0",
4
+ "storagePrecision" : "Mixed (Float32, Palettized (8 bits), UInt8)",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float16",
10
+ "formattedType" : "MultiArray (Float16 1 × 15 × 2048)",
11
+ "shortDescription" : "",
12
+ "shape" : "[1, 15, 2048]",
13
+ "name" : "all_logits",
14
+ "type" : "MultiArray"
15
+ },
16
+ {
17
+ "hasShapeFlexibility" : "0",
18
+ "isOptional" : "0",
19
+ "dataType" : "Float16",
20
+ "formattedType" : "MultiArray (Float16 1 × 1024 × 1 × 1)",
21
+ "shortDescription" : "",
22
+ "shape" : "[1, 1024, 1, 1]",
23
+ "name" : "hidden_states",
24
+ "type" : "MultiArray"
25
+ },
26
+ {
27
+ "hasShapeFlexibility" : "0",
28
+ "isOptional" : "0",
29
+ "dataType" : "Float16",
30
+ "formattedType" : "MultiArray (Float16 1 × 5120 × 1 × 16)",
31
+ "shortDescription" : "",
32
+ "shape" : "[1, 5120, 1, 16]",
33
+ "name" : "new_key_cache",
34
+ "type" : "MultiArray"
35
+ },
36
+ {
37
+ "hasShapeFlexibility" : "0",
38
+ "isOptional" : "0",
39
+ "dataType" : "Float16",
40
+ "formattedType" : "MultiArray (Float16 1 × 5120 × 1 × 16)",
41
+ "shortDescription" : "",
42
+ "shape" : "[1, 5120, 1, 16]",
43
+ "name" : "new_value_cache",
44
+ "type" : "MultiArray"
45
+ }
46
+ ],
47
+ "modelParameters" : [
48
+
49
+ ],
50
+ "specificationVersion" : 9,
51
+ "mlProgramOperationTypeHistogram" : {
52
+ "Ios18.expandDims" : 51,
53
+ "Ios18.softmax" : 5,
54
+ "Ios18.cos" : 1,
55
+ "Ios18.mul" : 106,
56
+ "Ios18.matmul" : 11,
57
+ "Ios18.rsqrt" : 21,
58
+ "Ios16.reduceMean" : 21,
59
+ "Ios18.sin" : 1,
60
+ "Tile" : 10,
61
+ "Ios18.add" : 58,
62
+ "Ios18.reshape" : 45,
63
+ "Ios18.constexprLutToDense" : 50,
64
+ "Ios18.linear" : 50,
65
+ "Ios18.concat" : 13,
66
+ "Ios18.transpose" : 11,
67
+ "Ios18.sub" : 1,
68
+ "Ios18.pow" : 21,
69
+ "Ios18.cast" : 10,
70
+ "Ios18.silu" : 5,
71
+ "Stack" : 1,
72
+ "Ios18.sliceByIndex" : 30,
73
+ "Ios18.squeeze" : 68
74
+ },
75
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
76
+ "isUpdatable" : "0",
77
+ "stateSchema" : [
78
+
79
+ ],
80
+ "availability" : {
81
+ "macOS" : "15.0",
82
+ "tvOS" : "18.0",
83
+ "visionOS" : "2.0",
84
+ "watchOS" : "11.0",
85
+ "iOS" : "18.0",
86
+ "macCatalyst" : "18.0"
87
+ },
88
+ "modelType" : {
89
+ "name" : "MLModelType_mlProgram"
90
+ },
91
+ "userDefinedMetadata" : {
92
+ "com.github.apple.coremltools.conversion_date" : "2026-03-30",
93
+ "com.github.apple.coremltools.source" : "torch==2.10.0",
94
+ "com.github.apple.coremltools.version" : "9.0",
95
+ "com.github.apple.coremltools.source_dialect" : "TorchScript"
96
+ },
97
+ "inputSchema" : [
98
+ {
99
+ "hasShapeFlexibility" : "0",
100
+ "isOptional" : "0",
101
+ "dataType" : "Float16",
102
+ "formattedType" : "MultiArray (Float16 1 × 1024 × 1 × 1)",
103
+ "shortDescription" : "",
104
+ "shape" : "[1, 1024, 1, 1]",
105
+ "name" : "input_embeds",
106
+ "type" : "MultiArray"
107
+ },
108
+ {
109
+ "hasShapeFlexibility" : "0",
110
+ "isOptional" : "0",
111
+ "dataType" : "Int32",
112
+ "formattedType" : "MultiArray (Int32 1)",
113
+ "shortDescription" : "",
114
+ "shape" : "[1]",
115
+ "name" : "cache_length",
116
+ "type" : "MultiArray"
117
+ },
118
+ {
119
+ "hasShapeFlexibility" : "0",
120
+ "isOptional" : "0",
121
+ "dataType" : "Float16",
122
+ "formattedType" : "MultiArray (Float16 1 × 5120 × 1 × 16)",
123
+ "shortDescription" : "",
124
+ "shape" : "[1, 5120, 1, 16]",
125
+ "name" : "key_cache",
126
+ "type" : "MultiArray"
127
+ },
128
+ {
129
+ "hasShapeFlexibility" : "0",
130
+ "isOptional" : "0",
131
+ "dataType" : "Float16",
132
+ "formattedType" : "MultiArray (Float16 1 × 16)",
133
+ "shortDescription" : "",
134
+ "shape" : "[1, 16]",
135
+ "name" : "key_padding_mask",
136
+ "type" : "MultiArray"
137
+ },
138
+ {
139
+ "hasShapeFlexibility" : "0",
140
+ "isOptional" : "0",
141
+ "dataType" : "Float16",
142
+ "formattedType" : "MultiArray (Float16 1 × 16)",
143
+ "shortDescription" : "",
144
+ "shape" : "[1, 16]",
145
+ "name" : "kv_cache_update_mask",
146
+ "type" : "MultiArray"
147
+ },
148
+ {
149
+ "hasShapeFlexibility" : "0",
150
+ "isOptional" : "0",
151
+ "dataType" : "Float16",
152
+ "formattedType" : "MultiArray (Float16 1 × 5120 × 1 × 16)",
153
+ "shortDescription" : "",
154
+ "shape" : "[1, 5120, 1, 16]",
155
+ "name" : "value_cache",
156
+ "type" : "MultiArray"
157
+ }
158
+ ],
159
+ "generatedClassName" : "MultiCodeDecoder",
160
+ "method" : "predict"
161
+ }
162
+ ]
MultiCodeDecoder.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
{Talker.mlmodelc → MultiCodeDecoder.mlmodelc}/weights/weight.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7ecf9b65affc83a8d09586e223e520d94ecbd015af8aa41d45e1af9a9647e95
3
- size 443812480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6576808c3628a4065e578154a9d2473b303cb8b1eb2516bb9f2595728fbd50f0
3
+ size 110234752
MultiCodeEmbedder.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:217a014dd5f42957a214530704a9e1764035baa415d29d243a1df80d25e3e41b
3
+ size 243
MultiCodeEmbedder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dddbe801a9e029787cfa48d15ef2dad0606a617f9b719211c2c46e6698f30d56
3
+ size 380
MultiCodeEmbedder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "metadataOutputVersion" : "3.0",
4
+ "storagePrecision" : "Float16",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float16",
10
+ "formattedType" : "MultiArray (Float16 1024 × 1 × 1)",
11
+ "shortDescription" : "",
12
+ "shape" : "[1024, 1, 1]",
13
+ "name" : "input_embeds",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "modelParameters" : [
18
+
19
+ ],
20
+ "specificationVersion" : 9,
21
+ "mlProgramOperationTypeHistogram" : {
22
+ "Select" : 1,
23
+ "Ios18.squeeze" : 2,
24
+ "Ios18.gather" : 1,
25
+ "Ios18.expandDims" : 2,
26
+ "Ios18.cast" : 3,
27
+ "Ios18.greaterEqual" : 1,
28
+ "Ios18.add" : 1
29
+ },
30
+ "computePrecision" : "Mixed (Float16, Int16, Int32)",
31
+ "isUpdatable" : "0",
32
+ "stateSchema" : [
33
+
34
+ ],
35
+ "availability" : {
36
+ "macOS" : "15.0",
37
+ "tvOS" : "18.0",
38
+ "visionOS" : "2.0",
39
+ "watchOS" : "11.0",
40
+ "iOS" : "18.0",
41
+ "macCatalyst" : "18.0"
42
+ },
43
+ "modelType" : {
44
+ "name" : "MLModelType_mlProgram"
45
+ },
46
+ "userDefinedMetadata" : {
47
+ "com.github.apple.coremltools.conversion_date" : "2026-03-30",
48
+ "com.github.apple.coremltools.source" : "torch==2.10.0",
49
+ "com.github.apple.coremltools.version" : "9.0",
50
+ "com.github.apple.coremltools.source_dialect" : "TorchScript"
51
+ },
52
+ "inputSchema" : [
53
+ {
54
+ "hasShapeFlexibility" : "0",
55
+ "isOptional" : "0",
56
+ "dataType" : "Int32",
57
+ "formattedType" : "MultiArray (Int32 1)",
58
+ "shortDescription" : "",
59
+ "shape" : "[1]",
60
+ "name" : "input_ids",
61
+ "type" : "MultiArray"
62
+ }
63
+ ],
64
+ "generatedClassName" : "MultiCodeEmbedder",
65
+ "method" : "predict"
66
+ }
67
+ ]
MultiCodeEmbedder.mlmodelc/model.mil ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ program(1.3)
2
+ [buildInfo = dict<string, string>({{"coremlc-component-MIL", "3510.2.1"}, {"coremlc-version", "3500.32.1"}, {"coremltools-component-torch", "2.10.0"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "9.0"}})]
3
+ {
4
+ func main<ios18>(tensor<int32, [1]> input_ids) {
5
+ int32 emb_batch_dims_0 = const()[name = string("emb_batch_dims_0"), val = int32(0)];
6
+ bool emb_validate_indices_0 = const()[name = string("emb_validate_indices_0"), val = bool(false)];
7
+ tensor<fp16, [30720, 1024]> embedding_weight_to_fp16 = const()[name = string("embedding_weight_to_fp16"), val = tensor<fp16, [30720, 1024]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64)))];
8
+ string input_ids_to_int16_dtype_0 = const()[name = string("input_ids_to_int16_dtype_0"), val = string("int16")];
9
+ string cast_2_dtype_0 = const()[name = string("cast_2_dtype_0"), val = string("int32")];
10
+ int32 greater_equal_0_y_0 = const()[name = string("greater_equal_0_y_0"), val = int32(0)];
11
+ tensor<int16, [1]> input_ids_to_int16 = cast(dtype = input_ids_to_int16_dtype_0, x = input_ids)[name = string("cast_5")];
12
+ tensor<int32, [1]> cast_2 = cast(dtype = cast_2_dtype_0, x = input_ids_to_int16)[name = string("cast_4")];
13
+ tensor<bool, [1]> greater_equal_0 = greater_equal(x = cast_2, y = greater_equal_0_y_0)[name = string("greater_equal_0")];
14
+ int32 slice_by_index_0 = const()[name = string("slice_by_index_0"), val = int32(30720)];
15
+ tensor<int32, [1]> add_0 = add(x = cast_2, y = slice_by_index_0)[name = string("add_0")];
16
+ tensor<int32, [1]> select_0 = select(a = cast_2, b = add_0, cond = greater_equal_0)[name = string("select_0")];
17
+ int32 emb_cast_fp16_cast_uint16_axis_0 = const()[name = string("emb_cast_fp16_cast_uint16_axis_0"), val = int32(0)];
18
+ string select_0_to_int16_dtype_0 = const()[name = string("select_0_to_int16_dtype_0"), val = string("int16")];
19
+ tensor<int16, [1]> select_0_to_int16 = cast(dtype = select_0_to_int16_dtype_0, x = select_0)[name = string("cast_3")];
20
+ tensor<fp16, [1, 1024]> emb_cast_fp16_cast_uint16_cast_uint16 = gather(axis = emb_cast_fp16_cast_uint16_axis_0, batch_dims = emb_batch_dims_0, indices = select_0_to_int16, validate_indices = emb_validate_indices_0, x = embedding_weight_to_fp16)[name = string("emb_cast_fp16_cast_uint16_cast_uint16")];
21
+ tensor<int32, [1]> var_8_axes_0 = const()[name = string("op_8_axes_0"), val = tensor<int32, [1]>([0])];
22
+ tensor<fp16, [1024]> var_8_cast_fp16 = squeeze(axes = var_8_axes_0, x = emb_cast_fp16_cast_uint16_cast_uint16)[name = string("op_8_cast_fp16")];
23
+ tensor<fp16, [1024]> var_10_cast_fp16 = squeeze(x = var_8_cast_fp16)[name = string("op_10_cast_fp16")];
24
+ tensor<int32, [1]> var_12_axes_0 = const()[name = string("op_12_axes_0"), val = tensor<int32, [1]>([-1])];
25
+ tensor<fp16, [1024, 1]> var_12_cast_fp16 = expand_dims(axes = var_12_axes_0, x = var_10_cast_fp16)[name = string("op_12_cast_fp16")];
26
+ tensor<int32, [1]> var_14_axes_0 = const()[name = string("op_14_axes_0"), val = tensor<int32, [1]>([-1])];
27
+ tensor<fp16, [1024, 1, 1]> input_embeds = expand_dims(axes = var_14_axes_0, x = var_12_cast_fp16)[name = string("op_14_cast_fp16")];
28
+ } -> (input_embeds);
29
+ }
MultiCodeEmbedder.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9215324f237e6e41298eaca272ea0d6f0b6c10b36ee00fd1009e03f2b193485c
3
+ size 62914688
SpeechDecoder.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a79a81c5dcb274ad3102040cfe775bc2bcfcdf07a1940737027ea31b878f258d
3
+ size 243
SpeechDecoder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65312a07616d4b78cad34ae7c37d3579a6b0316e04caa63ebf9aa1882473c99b
3
+ size 378
{MimiDecoder.mlmodelc → SpeechDecoder.mlmodelc}/metadata.json RENAMED
@@ -1,16 +1,16 @@
1
  [
2
  {
3
  "metadataOutputVersion" : "3.0",
4
- "storagePrecision" : "Float16",
5
  "outputSchema" : [
6
  {
7
  "hasShapeFlexibility" : "0",
8
  "isOptional" : "0",
9
  "dataType" : "Float16",
10
- "formattedType" : "MultiArray (Float16)",
11
  "shortDescription" : "",
12
- "shape" : "[]",
13
- "name" : "waveform",
14
  "type" : "MultiArray"
15
  }
16
  ],
@@ -20,31 +20,30 @@
20
  "specificationVersion" : 9,
21
  "mlProgramOperationTypeHistogram" : {
22
  "Ios18.softmax" : 8,
23
- "Ios18.mul" : 219,
24
  "Ios18.matmul" : 16,
25
  "Ios18.rsqrt" : 17,
26
  "Ios16.reduceMean" : 17,
27
  "Ios18.sin" : 29,
28
- "Ios18.greaterEqual" : 1,
29
- "Select" : 1,
30
- "Ios18.gather" : 24,
31
- "Ios18.add" : 116,
32
  "Ios18.layerNorm" : 2,
33
  "Ios18.reshape" : 32,
34
- "Shape" : 8,
35
  "Pad" : 17,
 
36
  "Ios18.linear" : 62,
37
  "Ios18.conv" : 31,
38
- "Ios18.concat" : 27,
39
- "Ios18.sub" : 16,
40
  "Ios18.transpose" : 40,
41
- "Ios18.cast" : 34,
42
- "Ios18.pow" : 17,
43
  "Ios18.silu" : 8,
44
  "Ios18.gelu" : 2,
 
45
  "Ios18.convTranspose" : 6,
46
- "Ios18.sliceByIndex" : 56,
47
- "Ios18.clip" : 1
48
  },
49
  "computePrecision" : "Mixed (Float16, Float32, Int16, Int32, UInt16)",
50
  "isUpdatable" : "0",
@@ -63,26 +62,24 @@
63
  "name" : "MLModelType_mlProgram"
64
  },
65
  "userDefinedMetadata" : {
66
- "com.github.apple.coremltools.conversion_date" : "2026-03-29",
67
  "com.github.apple.coremltools.source" : "torch==2.10.0",
68
  "com.github.apple.coremltools.version" : "9.0",
69
  "com.github.apple.coremltools.source_dialect" : "TorchScript"
70
  },
71
  "inputSchema" : [
72
  {
73
- "shortDescription" : "",
74
- "dataType" : "Int32",
75
- "hasShapeFlexibility" : "1",
76
  "isOptional" : "0",
77
- "shapeFlexibility" : "1 × 16 × 4 | 1 × 16 × 14 | 1 × 16 × 35 | 1 × 16 × 50",
78
- "formattedType" : "MultiArray (Int32 1 × 16 × 4)",
79
- "type" : "MultiArray",
80
- "shape" : "[1, 16, 4]",
81
- "name" : "codes",
82
- "enumeratedShapes" : "[[1, 16, 4], [1, 16, 14], [1, 16, 35], [1, 16, 50]]"
83
  }
84
  ],
85
- "generatedClassName" : "MimiDecoder",
86
  "method" : "predict"
87
  }
88
  ]
 
1
  [
2
  {
3
  "metadataOutputVersion" : "3.0",
4
+ "storagePrecision" : "Mixed (Float16, Palettized (8 bits), UInt8)",
5
  "outputSchema" : [
6
  {
7
  "hasShapeFlexibility" : "0",
8
  "isOptional" : "0",
9
  "dataType" : "Float16",
10
+ "formattedType" : "MultiArray (Float16 1 × 1 × 240000)",
11
  "shortDescription" : "",
12
+ "shape" : "[1, 1, 240000]",
13
+ "name" : "audio",
14
  "type" : "MultiArray"
15
  }
16
  ],
 
20
  "specificationVersion" : 9,
21
  "mlProgramOperationTypeHistogram" : {
22
  "Ios18.softmax" : 8,
23
+ "Ios18.mul" : 158,
24
  "Ios18.matmul" : 16,
25
  "Ios18.rsqrt" : 17,
26
  "Ios16.reduceMean" : 17,
27
  "Ios18.sin" : 29,
28
+ "Ios18.greaterEqual" : 2,
29
+ "Select" : 2,
30
+ "Ios18.gather" : 16,
31
+ "Ios18.add" : 117,
32
  "Ios18.layerNorm" : 2,
33
  "Ios18.reshape" : 32,
 
34
  "Pad" : 17,
35
+ "Ios18.constexprLutToDense" : 133,
36
  "Ios18.linear" : 62,
37
  "Ios18.conv" : 31,
38
+ "Ios18.concat" : 16,
 
39
  "Ios18.transpose" : 40,
40
+ "Ios18.cast" : 19,
41
+ "Ios18.pow" : 46,
42
  "Ios18.silu" : 8,
43
  "Ios18.gelu" : 2,
44
+ "Ios18.clip" : 1,
45
  "Ios18.convTranspose" : 6,
46
+ "Ios18.sliceByIndex" : 54
 
47
  },
48
  "computePrecision" : "Mixed (Float16, Float32, Int16, Int32, UInt16)",
49
  "isUpdatable" : "0",
 
62
  "name" : "MLModelType_mlProgram"
63
  },
64
  "userDefinedMetadata" : {
65
+ "com.github.apple.coremltools.conversion_date" : "2026-03-30",
66
  "com.github.apple.coremltools.source" : "torch==2.10.0",
67
  "com.github.apple.coremltools.version" : "9.0",
68
  "com.github.apple.coremltools.source_dialect" : "TorchScript"
69
  },
70
  "inputSchema" : [
71
  {
72
+ "hasShapeFlexibility" : "0",
 
 
73
  "isOptional" : "0",
74
+ "dataType" : "Int32",
75
+ "formattedType" : "MultiArray (Int32 1 × 16 × 125)",
76
+ "shortDescription" : "",
77
+ "shape" : "[1, 16, 125]",
78
+ "name" : "audio_codes",
79
+ "type" : "MultiArray"
80
  }
81
  ],
82
+ "generatedClassName" : "SpeechDecoder",
83
  "method" : "predict"
84
  }
85
  ]
SpeechDecoder.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
{CodePredictor.mlmodelc → SpeechDecoder.mlmodelc}/weights/weight.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:569ed049b7819129c6a83cce000a932c9cdc78ff7b5a5bf4e364278846222cae
3
- size 314651712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00a1ed6d52f41d82a8da012a1344f2df17d0b1d658957c5f2afa52a4b186d03d
3
+ size 114209024
Talker.mlmodelc/coremldata.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:9b2bac3c7bb2a17381413465a43834b013095bf4f23f1ae95d4c929f5f8675ca
3
- size 672
 
 
 
 
Talker.mlmodelc/model.mil DELETED
The diff for this file is too large to render. See raw diff
 
TextProjector.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3a2e57b7663be9f3871eb8b39b7c99da3b597bc6da4f416302d7ae5c8654f1d
3
+ size 243
TextProjector.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9beb53dcdd366de5a75e075dfec05c3289e92ccc39c624b42ac39811e90c3437
3
+ size 380
TextProjector.mlmodelc/metadata.json ADDED
@@ -0,0 +1,69 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "metadataOutputVersion" : "3.0",
4
+ "storagePrecision" : "Mixed (Float16, Palettized (8 bits), UInt8)",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float16",
10
+ "formattedType" : "MultiArray (Float16 1024 × 1 × 1)",
11
+ "shortDescription" : "",
12
+ "shape" : "[1024, 1, 1]",
13
+ "name" : "input_embeds",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "modelParameters" : [
18
+
19
+ ],
20
+ "specificationVersion" : 9,
21
+ "mlProgramOperationTypeHistogram" : {
22
+ "Select" : 2,
23
+ "Ios18.squeeze" : 2,
24
+ "Ios18.gather" : 1,
25
+ "Ios18.linear" : 2,
26
+ "Ios18.expandDims" : 2,
27
+ "Ios18.constexprLutToDense" : 3,
28
+ "Ios18.silu" : 1,
29
+ "Ios18.greaterEqual" : 2,
30
+ "Ios18.add" : 2
31
+ },
32
+ "computePrecision" : "Mixed (Float16, Int32)",
33
+ "isUpdatable" : "0",
34
+ "stateSchema" : [
35
+
36
+ ],
37
+ "availability" : {
38
+ "macOS" : "15.0",
39
+ "tvOS" : "18.0",
40
+ "visionOS" : "2.0",
41
+ "watchOS" : "11.0",
42
+ "iOS" : "18.0",
43
+ "macCatalyst" : "18.0"
44
+ },
45
+ "modelType" : {
46
+ "name" : "MLModelType_mlProgram"
47
+ },
48
+ "userDefinedMetadata" : {
49
+ "com.github.apple.coremltools.conversion_date" : "2026-03-30",
50
+ "com.github.apple.coremltools.source" : "torch==2.10.0",
51
+ "com.github.apple.coremltools.version" : "9.0",
52
+ "com.github.apple.coremltools.source_dialect" : "TorchScript"
53
+ },
54
+ "inputSchema" : [
55
+ {
56
+ "hasShapeFlexibility" : "0",
57
+ "isOptional" : "0",
58
+ "dataType" : "Int32",
59
+ "formattedType" : "MultiArray (Int32 1)",
60
+ "shortDescription" : "",
61
+ "shape" : "[1]",
62
+ "name" : "input_ids",
63
+ "type" : "MultiArray"
64
+ }
65
+ ],
66
+ "generatedClassName" : "TextProjector",
67
+ "method" : "predict"
68
+ }
69
+ ]
TextProjector.mlmodelc/model.mil ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ program(1.3)
2
+ [buildInfo = dict<string, string>({{"coremlc-component-MIL", "3510.2.1"}, {"coremlc-version", "3500.32.1"}})]
3
+ {
4
+ func main<ios18>(tensor<int32, [1]> input_ids) {
5
+ int32 input_1_batch_dims_0 = const()[name = string("input_1_batch_dims_0"), val = int32(0)];
6
+ bool input_1_validate_indices_0 = const()[name = string("input_1_validate_indices_0"), val = bool(false)];
7
+ tensor<fp16, [151936, 2048]> text_embedding_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor<uint8, [151936, 2048]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64))), lut = tensor<fp16, [1, 1, 256, 1]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(311165056))))[name = string("text_embedding_weight_to_fp16_palettized")];
8
+ int32 greater_equal_0_y_0 = const()[name = string("greater_equal_0_y_0"), val = int32(0)];
9
+ tensor<bool, [1]> greater_equal_0 = greater_equal(x = input_ids, y = greater_equal_0_y_0)[name = string("greater_equal_0")];
10
+ int32 slice_by_index_0 = const()[name = string("slice_by_index_0"), val = int32(151936)];
11
+ tensor<int32, [1]> add_0 = add(x = input_ids, y = slice_by_index_0)[name = string("add_0")];
12
+ tensor<int32, [1]> select_0 = select(a = input_ids, b = add_0, cond = greater_equal_0)[name = string("select_0")];
13
+ int32 greater_equal_0_y_0_1 = const()[name = string("greater_equal_0_y_0_1"), val = int32(0)];
14
+ tensor<bool, [1]> greater_equal_0_1 = greater_equal(x = select_0, y = greater_equal_0_y_0_1)[name = string("greater_equal_0_1")];
15
+ int32 slice_by_index_0_1 = const()[name = string("slice_by_index_0_1"), val = int32(151936)];
16
+ tensor<int32, [1]> add_0_1 = add(x = select_0, y = slice_by_index_0_1)[name = string("add_0_1")];
17
+ tensor<int32, [1]> select_0_1 = select(a = select_0, b = add_0_1, cond = greater_equal_0_1)[name = string("select_0_1")];
18
+ int32 input_1_cast_fp16_axis_0 = const()[name = string("input_1_cast_fp16_axis_0"), val = int32(0)];
19
+ tensor<fp16, [1, 2048]> input_1_cast_fp16 = gather(axis = input_1_cast_fp16_axis_0, batch_dims = input_1_batch_dims_0, indices = select_0_1, validate_indices = input_1_validate_indices_0, x = text_embedding_weight_to_fp16_palettized)[name = string("input_1_cast_fp16")];
20
+ tensor<fp16, [2048, 2048]> text_projection_linear_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor<uint8, [2048, 2048]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(311165632))), lut = tensor<fp16, [1, 1, 256, 1]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(315360000))))[name = string("text_projection_linear_fc1_weight_to_fp16_palettized")];
21
+ tensor<fp16, [2048]> text_projection_linear_fc1_bias_to_fp16 = const()[name = string("text_projection_linear_fc1_bias_to_fp16"), val = tensor<fp16, [2048]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(315360576)))];
22
+ tensor<fp16, [1, 2048]> linear_0_cast_fp16 = linear(bias = text_projection_linear_fc1_bias_to_fp16, weight = text_projection_linear_fc1_weight_to_fp16_palettized, x = input_1_cast_fp16)[name = string("linear_0_cast_fp16")];
23
+ tensor<fp16, [1, 2048]> input_cast_fp16 = silu(x = linear_0_cast_fp16)[name = string("input_cast_fp16")];
24
+ tensor<fp16, [1024, 2048]> text_projection_linear_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor<uint8, [1024, 2048]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(315364736))), lut = tensor<fp16, [1, 1, 256, 1]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(317461952))))[name = string("text_projection_linear_fc2_weight_to_fp16_palettized")];
25
+ tensor<fp16, [1024]> text_projection_linear_fc2_bias_to_fp16 = const()[name = string("text_projection_linear_fc2_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(317462528)))];
26
+ tensor<fp16, [1, 1024]> linear_1_cast_fp16 = linear(bias = text_projection_linear_fc2_bias_to_fp16, weight = text_projection_linear_fc2_weight_to_fp16_palettized, x = input_cast_fp16)[name = string("linear_1_cast_fp16")];
27
+ tensor<int32, [1]> var_18_axes_0 = const()[name = string("op_18_axes_0"), val = tensor<int32, [1]>([0])];
28
+ tensor<fp16, [1024]> var_18_cast_fp16 = squeeze(axes = var_18_axes_0, x = linear_1_cast_fp16)[name = string("op_18_cast_fp16")];
29
+ tensor<fp16, [1024]> var_20_cast_fp16 = squeeze(x = var_18_cast_fp16)[name = string("op_20_cast_fp16")];
30
+ tensor<int32, [1]> var_22_axes_0 = const()[name = string("op_22_axes_0"), val = tensor<int32, [1]>([-1])];
31
+ tensor<fp16, [1024, 1]> var_22_cast_fp16 = expand_dims(axes = var_22_axes_0, x = var_20_cast_fp16)[name = string("op_22_cast_fp16")];
32
+ tensor<int32, [1]> var_24_axes_0 = const()[name = string("op_24_axes_0"), val = tensor<int32, [1]>([-1])];
33
+ tensor<fp16, [1024, 1, 1]> input_embeds = expand_dims(axes = var_24_axes_0, x = var_22_cast_fp16)[name = string("op_24_cast_fp16")];
34
+ } -> (input_embeds);
35
+ }
TextProjector.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78ece3af64cde140b4a2fecdb4117461956b6887cff95d060adf23168b2f93d3
3
+ size 317464640
config.json CHANGED
@@ -1,15 +1,19 @@
1
  {
2
  "model_type": "qwen3_tts_coreml",
 
3
  "model_id": "Qwen/Qwen3-TTS-12Hz-0.6B-Base",
 
 
 
 
 
 
 
 
 
 
 
 
4
  "hidden_size": 1024,
5
- "num_layers": 28,
6
- "num_heads": 16,
7
- "num_kv_heads": 8,
8
- "head_dim": 128,
9
- "intermediate_size": 3072,
10
- "codec_vocab_size": 3072,
11
- "text_hidden_size": 2048,
12
- "text_vocab_size": 151936,
13
- "max_seq_len": 512,
14
- "quantization": "int8"
15
  }
 
1
  {
2
  "model_type": "qwen3_tts_coreml",
3
+ "architecture": "6-model-ane",
4
  "model_id": "Qwen/Qwen3-TTS-12Hz-0.6B-Base",
5
+ "models": [
6
+ "TextProjector",
7
+ "CodeEmbedder",
8
+ "MultiCodeEmbedder",
9
+ "CodeDecoder",
10
+ "MultiCodeDecoder",
11
+ "SpeechDecoder"
12
+ ],
13
+ "quantization": "W8A16",
14
+ "max_seq_len": 256,
15
+ "max_codec_tokens": 125,
16
+ "sample_rate": 24000,
17
  "hidden_size": 1024,
18
+ "requires_speaker_embedding": true
 
 
 
 
 
 
 
 
 
19
  }
embeddings.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:dc051095c79172639ea331308a35dcf7a242da6c99c8b56ff5347ed6df788d5e
3
- size 767042816
 
 
 
 
CodePredictor.mlmodelc/coremldata.bin → speaker_embedding.npy RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:10759300000129103c06b834961616b4094b766d20ea2ae68fe216f0ae0293f9
3
- size 1509
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f4dbee4423ef6c15fcfbac5eeaefe2de2d7c2ffc305c81a1adefbf255aadfd4
3
+ size 4224
tts_bos_embed.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fa7ddf7338467bd9210725673f307f600e34817709d34b67f47eff3d8a5650c
3
+ size 4224
tts_eos_embed.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3edd5d5c1432e9129bd942683928f8ded011a0942cf66a34a7969d6062dbbdb8
3
+ size 4224
tts_pad_embed.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06d52c2f64113a6e027d622cb939d06e949137dc5a4ad92100432cf92ff25a89
3
+ size 4224