mweinbach1 committed on
Commit
10cbeb6
·
verified ·
1 Parent(s): 65c8d85

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .DS_Store +0 -0
  2. .gitattributes +1 -0
  3. config.json +4 -0
  4. merges.txt +0 -0
  5. meta.yaml +24 -0
  6. phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/analytics/coremldata.bin +3 -0
  7. phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/coremldata.bin +3 -0
  8. phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/metadata.json +299 -0
  9. phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/model.mil +0 -0
  10. phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/weights/weight.bin +3 -0
  11. phi4_FFN_PF_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
  12. phi4_FFN_PF_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
  13. phi4_FFN_PF_lut4_chunk_01of02.mlpackage/Manifest.json +18 -0
  14. phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/analytics/coremldata.bin +3 -0
  15. phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/coremldata.bin +3 -0
  16. phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/metadata.json +299 -0
  17. phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/model.mil +0 -0
  18. phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/weights/weight.bin +3 -0
  19. phi4_FFN_PF_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
  20. phi4_FFN_PF_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
  21. phi4_FFN_PF_lut4_chunk_02of02.mlpackage/Manifest.json +18 -0
  22. phi4_FFN_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
  23. phi4_FFN_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
  24. phi4_FFN_lut4_chunk_01of02.mlpackage/Manifest.json +18 -0
  25. phi4_FFN_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
  26. phi4_FFN_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
  27. phi4_FFN_lut4_chunk_02of02.mlpackage/Manifest.json +18 -0
  28. phi4_embeddings_lut8.mlmodelc/analytics/coremldata.bin +3 -0
  29. phi4_embeddings_lut8.mlmodelc/coremldata.bin +3 -0
  30. phi4_embeddings_lut8.mlmodelc/metadata.json +65 -0
  31. phi4_embeddings_lut8.mlmodelc/model.mil +21 -0
  32. phi4_embeddings_lut8.mlmodelc/weights/weight.bin +3 -0
  33. phi4_embeddings_lut8.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
  34. phi4_embeddings_lut8.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
  35. phi4_embeddings_lut8.mlpackage/Manifest.json +18 -0
  36. phi4_lm_head_lut6.mlmodelc/analytics/coremldata.bin +3 -0
  37. phi4_lm_head_lut6.mlmodelc/coremldata.bin +3 -0
  38. phi4_lm_head_lut6.mlmodelc/metadata.json +63 -0
  39. phi4_lm_head_lut6.mlmodelc/model.mil +17 -0
  40. phi4_lm_head_lut6.mlmodelc/weights/weight.bin +3 -0
  41. phi4_lm_head_lut6.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
  42. phi4_lm_head_lut6.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
  43. phi4_lm_head_lut6.mlpackage/Manifest.json +18 -0
  44. phi4_prefill_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
  45. phi4_prefill_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
  46. phi4_prefill_lut4_chunk_01of02.mlpackage/Manifest.json +18 -0
  47. phi4_prefill_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
  48. phi4_prefill_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
  49. phi4_prefill_lut4_chunk_02of02.mlpackage/Manifest.json +18 -0
  50. tokenizer.json +3 -0
.DS_Store ADDED
Binary file (6.15 kB). View file
 
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "tokenizer_class": "AutoTokenizer",
3
+ "model_type": "phi3"
4
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
meta.yaml ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model_info:
2
+ name: anemll-5a149550068a1eb93398160d8953f5f56c3603e9-ctx2048
3
+ version: 0.3.0
4
+ description: |
5
+ Demonstrates running 5a149550068a1eb93398160d8953f5f56c3603e9 on Apple Neural Engine
6
+ Context length: 2048
7
+ Batch size: 64
8
+ Chunks: 2
9
+ license: MIT
10
+ author: Anemll
11
+ framework: Core ML
12
+ language: Python
13
+ parameters:
14
+ context_length: 2048
15
+ batch_size: 64
16
+ lut_embeddings: 8
17
+ lut_ffn: 4
18
+ lut_lmhead: 6
19
+ num_chunks: 2
20
+ model_prefix: phi4
21
+ embeddings: phi4_embeddings_lut8.mlmodelc
22
+ lm_head: phi4_lm_head_lut6.mlmodelc
23
+ ffn: phi4_FFN_PF_lut4.mlmodelc
24
+ split_lm_head: 1
phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9100ee1f47c46d82899674cb8dd1267b7b3be5159f56687398744760d68e748a
3
+ size 243
phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1dea759822bbf8031a58a2da1da1d9cca24edc09a4ba2c8a1d49917d5cc02716
3
+ size 743
phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/metadata.json ADDED
@@ -0,0 +1,299 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "metadataOutputVersion" : "3.0",
4
+ "userDefinedMetadata" : {
5
+ "com.github.apple.coremltools.source_dialect" : "TorchScript",
6
+ "com.github.apple.coremltools.source" : "torch==2.8.0",
7
+ "com.github.apple.coremltools.version" : "9.0b1",
8
+ "com.anemll.info" : "Converted with Anemll v0.3.4"
9
+ },
10
+ "availability" : {
11
+ "macOS" : "15.0",
12
+ "tvOS" : "18.0",
13
+ "visionOS" : "2.0",
14
+ "watchOS" : "11.0",
15
+ "iOS" : "18.0",
16
+ "macCatalyst" : "18.0"
17
+ },
18
+ "inputSchema" : [
19
+ {
20
+ "hasShapeFlexibility" : "0",
21
+ "isOptional" : "0",
22
+ "dataType" : "Float16",
23
+ "formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
24
+ "shortDescription" : "",
25
+ "shape" : "[1, 1, 3072]",
26
+ "name" : "hidden_states",
27
+ "type" : "MultiArray"
28
+ },
29
+ {
30
+ "hasShapeFlexibility" : "0",
31
+ "isOptional" : "0",
32
+ "dataType" : "Int32",
33
+ "formattedType" : "MultiArray (Int32 1)",
34
+ "shortDescription" : "",
35
+ "shape" : "[1]",
36
+ "name" : "position_ids",
37
+ "type" : "MultiArray"
38
+ },
39
+ {
40
+ "hasShapeFlexibility" : "0",
41
+ "isOptional" : "0",
42
+ "dataType" : "Float16",
43
+ "formattedType" : "MultiArray (Float16 1 × 1 × 1 × 2048)",
44
+ "shortDescription" : "",
45
+ "shape" : "[1, 1, 1, 2048]",
46
+ "name" : "causal_mask",
47
+ "type" : "MultiArray"
48
+ },
49
+ {
50
+ "hasShapeFlexibility" : "0",
51
+ "isOptional" : "0",
52
+ "dataType" : "Int32",
53
+ "formattedType" : "MultiArray (Int32 1)",
54
+ "shortDescription" : "",
55
+ "shape" : "[1]",
56
+ "name" : "current_pos",
57
+ "type" : "MultiArray"
58
+ }
59
+ ],
60
+ "outputSchema" : [
61
+ {
62
+ "hasShapeFlexibility" : "0",
63
+ "isOptional" : "0",
64
+ "dataType" : "Float16",
65
+ "formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
66
+ "shortDescription" : "",
67
+ "shape" : "[1, 1, 3072]",
68
+ "name" : "output_hidden_states",
69
+ "type" : "MultiArray"
70
+ }
71
+ ],
72
+ "modelParameters" : [
73
+
74
+ ],
75
+ "storagePrecision" : "Mixed (Float16, Int32, Palettized (11 bits), Palettized (13 bits), Palettized (15 bits), Palettized (7 bits), UInt4)",
76
+ "method" : "predict",
77
+ "functions" : [
78
+ {
79
+ "inputSchema" : [
80
+ {
81
+ "hasShapeFlexibility" : "0",
82
+ "isOptional" : "0",
83
+ "dataType" : "Float16",
84
+ "formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
85
+ "shortDescription" : "",
86
+ "shape" : "[1, 1, 3072]",
87
+ "name" : "hidden_states",
88
+ "type" : "MultiArray"
89
+ },
90
+ {
91
+ "hasShapeFlexibility" : "0",
92
+ "isOptional" : "0",
93
+ "dataType" : "Int32",
94
+ "formattedType" : "MultiArray (Int32 1)",
95
+ "shortDescription" : "",
96
+ "shape" : "[1]",
97
+ "name" : "position_ids",
98
+ "type" : "MultiArray"
99
+ },
100
+ {
101
+ "hasShapeFlexibility" : "0",
102
+ "isOptional" : "0",
103
+ "dataType" : "Float16",
104
+ "formattedType" : "MultiArray (Float16 1 × 1 × 1 × 2048)",
105
+ "shortDescription" : "",
106
+ "shape" : "[1, 1, 1, 2048]",
107
+ "name" : "causal_mask",
108
+ "type" : "MultiArray"
109
+ },
110
+ {
111
+ "hasShapeFlexibility" : "0",
112
+ "isOptional" : "0",
113
+ "dataType" : "Int32",
114
+ "formattedType" : "MultiArray (Int32 1)",
115
+ "shortDescription" : "",
116
+ "shape" : "[1]",
117
+ "name" : "current_pos",
118
+ "type" : "MultiArray"
119
+ }
120
+ ],
121
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
122
+ "storagePrecision" : "Mixed (Float16, Int32, Palettized (11 bits), Palettized (13 bits), Palettized (15 bits), Palettized (7 bits), UInt4)",
123
+ "stateSchema" : [
124
+
125
+ ],
126
+ "outputSchema" : [
127
+ {
128
+ "hasShapeFlexibility" : "0",
129
+ "isOptional" : "0",
130
+ "dataType" : "Float16",
131
+ "formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
132
+ "shortDescription" : "",
133
+ "shape" : "[1, 1, 3072]",
134
+ "name" : "output_hidden_states",
135
+ "type" : "MultiArray"
136
+ }
137
+ ],
138
+ "name" : "infer",
139
+ "mlProgramOperationTypeHistogram" : {
140
+ "Ios18.expandDims" : 69,
141
+ "Ios18.mul" : 194,
142
+ "Ios18.cos" : 1,
143
+ "Ios18.softmax" : 16,
144
+ "Ios18.matmul" : 33,
145
+ "Ios18.rsqrt" : 33,
146
+ "Identity" : 2,
147
+ "Ios16.reduceMean" : 33,
148
+ "Ios18.sin" : 1,
149
+ "Split" : 16,
150
+ "Select" : 1,
151
+ "Tile" : 32,
152
+ "Ios18.add" : 113,
153
+ "Ios16.fillLike" : 1,
154
+ "Ios18.sliceUpdate" : 32,
155
+ "Ios18.reshape" : 99,
156
+ "Ios18.constexprLutToDense" : 97,
157
+ "Ios18.conv" : 96,
158
+ "Ios18.concat" : 65,
159
+ "Ios18.cast" : 1,
160
+ "Ios18.transpose" : 18,
161
+ "Ios18.pow" : 33,
162
+ "Ios18.silu" : 16,
163
+ "Ios18.lessEqual" : 1,
164
+ "Ios18.sliceByIndex" : 160,
165
+ "Ios18.squeeze" : 16
166
+ }
167
+ },
168
+ {
169
+ "inputSchema" : [
170
+ {
171
+ "hasShapeFlexibility" : "0",
172
+ "isOptional" : "0",
173
+ "dataType" : "Float16",
174
+ "formattedType" : "MultiArray (Float16 1 × 64 × 3072)",
175
+ "shortDescription" : "",
176
+ "shape" : "[1, 64, 3072]",
177
+ "name" : "hidden_states",
178
+ "type" : "MultiArray"
179
+ },
180
+ {
181
+ "hasShapeFlexibility" : "0",
182
+ "isOptional" : "0",
183
+ "dataType" : "Int32",
184
+ "formattedType" : "MultiArray (Int32 64)",
185
+ "shortDescription" : "",
186
+ "shape" : "[64]",
187
+ "name" : "position_ids",
188
+ "type" : "MultiArray"
189
+ },
190
+ {
191
+ "hasShapeFlexibility" : "0",
192
+ "isOptional" : "0",
193
+ "dataType" : "Float16",
194
+ "formattedType" : "MultiArray (Float16 1 × 1 × 64 × 2048)",
195
+ "shortDescription" : "",
196
+ "shape" : "[1, 1, 64, 2048]",
197
+ "name" : "causal_mask",
198
+ "type" : "MultiArray"
199
+ },
200
+ {
201
+ "hasShapeFlexibility" : "0",
202
+ "isOptional" : "0",
203
+ "dataType" : "Int32",
204
+ "formattedType" : "MultiArray (Int32 1)",
205
+ "shortDescription" : "",
206
+ "shape" : "[1]",
207
+ "name" : "current_pos",
208
+ "type" : "MultiArray"
209
+ }
210
+ ],
211
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
212
+ "storagePrecision" : "Mixed (Float16, Palettized (11 bits), Palettized (13 bits), Palettized (15 bits), Palettized (7 bits), UInt4)",
213
+ "stateSchema" : [
214
+
215
+ ],
216
+ "outputSchema" : [
217
+ {
218
+ "hasShapeFlexibility" : "0",
219
+ "isOptional" : "0",
220
+ "dataType" : "Float16",
221
+ "formattedType" : "MultiArray (Float16 1 × 64 × 3072)",
222
+ "shortDescription" : "",
223
+ "shape" : "[1, 64, 3072]",
224
+ "name" : "output_hidden_states",
225
+ "type" : "MultiArray"
226
+ }
227
+ ],
228
+ "name" : "prefill",
229
+ "mlProgramOperationTypeHistogram" : {
230
+ "Ios18.expandDims" : 67,
231
+ "Ios18.softmax" : 16,
232
+ "Ios18.cos" : 1,
233
+ "Ios18.mul" : 192,
234
+ "Ios18.matmul" : 33,
235
+ "Ios18.rsqrt" : 32,
236
+ "Identity" : 2,
237
+ "Ios16.reduceMean" : 32,
238
+ "Ios18.sin" : 1,
239
+ "Split" : 16,
240
+ "Tile" : 32,
241
+ "Ios18.add" : 112,
242
+ "Ios18.sliceUpdate" : 32,
243
+ "Ios18.reshape" : 98,
244
+ "Ios18.constexprLutToDense" : 97,
245
+ "Ios18.conv" : 96,
246
+ "Ios18.concat" : 65,
247
+ "Ios18.cast" : 1,
248
+ "Ios18.transpose" : 80,
249
+ "Ios18.pow" : 32,
250
+ "Ios18.silu" : 16,
251
+ "Ios18.sliceByIndex" : 160,
252
+ "Ios18.squeeze" : 16
253
+ }
254
+ }
255
+ ],
256
+ "version" : "0.3.4",
257
+ "isUpdatable" : "0",
258
+ "defaultFunctionName" : "infer",
259
+ "specificationVersion" : 9,
260
+ "stateSchema" : [
261
+
262
+ ],
263
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
264
+ "mlProgramOperationTypeHistogram" : {
265
+ "Ios18.expandDims" : 69,
266
+ "Ios18.mul" : 194,
267
+ "Ios18.cos" : 1,
268
+ "Ios18.softmax" : 16,
269
+ "Ios18.matmul" : 33,
270
+ "Ios18.rsqrt" : 33,
271
+ "Identity" : 2,
272
+ "Ios16.reduceMean" : 33,
273
+ "Ios18.sin" : 1,
274
+ "Split" : 16,
275
+ "Select" : 1,
276
+ "Tile" : 32,
277
+ "Ios18.add" : 113,
278
+ "Ios16.fillLike" : 1,
279
+ "Ios18.sliceUpdate" : 32,
280
+ "Ios18.reshape" : 99,
281
+ "Ios18.constexprLutToDense" : 97,
282
+ "Ios18.conv" : 96,
283
+ "Ios18.concat" : 65,
284
+ "Ios18.cast" : 1,
285
+ "Ios18.transpose" : 18,
286
+ "Ios18.pow" : 33,
287
+ "Ios18.silu" : 16,
288
+ "Ios18.lessEqual" : 1,
289
+ "Ios18.sliceByIndex" : 160,
290
+ "Ios18.squeeze" : 16
291
+ },
292
+ "shortDescription" : "Anemll Model: Multifunction Combined",
293
+ "generatedClassName" : "phi4_FFN_PF_lut4_chunk_01of02",
294
+ "author" : "Converted with Anemll v0.3.4",
295
+ "modelType" : {
296
+ "name" : "MLModelType_mlProgram"
297
+ }
298
+ }
299
+ ]
phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9b1a80fd917817620853cba6084cc50181eb31bebd4b51c03242c3a60714cfa
3
+ size 942252864
phi4_FFN_PF_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ab2caaac8f312247b29b5373e405721bb43fc2afd9981a0d0969c8aeb367071
3
+ size 946777
phi4_FFN_PF_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9b1a80fd917817620853cba6084cc50181eb31bebd4b51c03242c3a60714cfa
3
+ size 942252864
phi4_FFN_PF_lut4_chunk_01of02.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "3ED36C90-09E7-454E-993A-613AD9D0DBA7": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Specification",
7
+ "name": "model.mlmodel",
8
+ "path": "com.apple.CoreML/model.mlmodel"
9
+ },
10
+ "56CB52E7-E373-4A88-A618-FABF77025DEB": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Weights",
13
+ "name": "weights",
14
+ "path": "com.apple.CoreML/weights"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "3ED36C90-09E7-454E-993A-613AD9D0DBA7"
18
+ }
phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d459fd207688db500187a3718f7e766ec41fcd451e5e5c621a05d084d401385a
3
+ size 243
phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:572b886153dff5be6f240438c1f30e1c5effc7454ae5f9915baa30719bbe7fe7
3
+ size 743
phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/metadata.json ADDED
@@ -0,0 +1,299 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "metadataOutputVersion" : "3.0",
4
+ "userDefinedMetadata" : {
5
+ "com.github.apple.coremltools.version" : "9.0b1",
6
+ "com.github.apple.coremltools.source" : "torch==2.8.0",
7
+ "com.anemll.info" : "Converted with Anemll v0.3.4",
8
+ "com.github.apple.coremltools.source_dialect" : "TorchScript"
9
+ },
10
+ "availability" : {
11
+ "macOS" : "15.0",
12
+ "tvOS" : "18.0",
13
+ "visionOS" : "2.0",
14
+ "watchOS" : "11.0",
15
+ "iOS" : "18.0",
16
+ "macCatalyst" : "18.0"
17
+ },
18
+ "inputSchema" : [
19
+ {
20
+ "hasShapeFlexibility" : "0",
21
+ "isOptional" : "0",
22
+ "dataType" : "Float16",
23
+ "formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
24
+ "shortDescription" : "",
25
+ "shape" : "[1, 1, 3072]",
26
+ "name" : "hidden_states",
27
+ "type" : "MultiArray"
28
+ },
29
+ {
30
+ "hasShapeFlexibility" : "0",
31
+ "isOptional" : "0",
32
+ "dataType" : "Int32",
33
+ "formattedType" : "MultiArray (Int32 1)",
34
+ "shortDescription" : "",
35
+ "shape" : "[1]",
36
+ "name" : "position_ids",
37
+ "type" : "MultiArray"
38
+ },
39
+ {
40
+ "hasShapeFlexibility" : "0",
41
+ "isOptional" : "0",
42
+ "dataType" : "Float16",
43
+ "formattedType" : "MultiArray (Float16 1 × 1 × 1 × 2048)",
44
+ "shortDescription" : "",
45
+ "shape" : "[1, 1, 1, 2048]",
46
+ "name" : "causal_mask",
47
+ "type" : "MultiArray"
48
+ },
49
+ {
50
+ "hasShapeFlexibility" : "0",
51
+ "isOptional" : "0",
52
+ "dataType" : "Int32",
53
+ "formattedType" : "MultiArray (Int32 1)",
54
+ "shortDescription" : "",
55
+ "shape" : "[1]",
56
+ "name" : "current_pos",
57
+ "type" : "MultiArray"
58
+ }
59
+ ],
60
+ "outputSchema" : [
61
+ {
62
+ "hasShapeFlexibility" : "0",
63
+ "isOptional" : "0",
64
+ "dataType" : "Float16",
65
+ "formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
66
+ "shortDescription" : "",
67
+ "shape" : "[1, 1, 3072]",
68
+ "name" : "output_hidden_states",
69
+ "type" : "MultiArray"
70
+ }
71
+ ],
72
+ "modelParameters" : [
73
+
74
+ ],
75
+ "storagePrecision" : "Mixed (Float16, Int32, Palettized (11 bits), Palettized (13 bits), Palettized (15 bits), Palettized (7 bits), UInt4)",
76
+ "method" : "predict",
77
+ "functions" : [
78
+ {
79
+ "inputSchema" : [
80
+ {
81
+ "hasShapeFlexibility" : "0",
82
+ "isOptional" : "0",
83
+ "dataType" : "Float16",
84
+ "formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
85
+ "shortDescription" : "",
86
+ "shape" : "[1, 1, 3072]",
87
+ "name" : "hidden_states",
88
+ "type" : "MultiArray"
89
+ },
90
+ {
91
+ "hasShapeFlexibility" : "0",
92
+ "isOptional" : "0",
93
+ "dataType" : "Int32",
94
+ "formattedType" : "MultiArray (Int32 1)",
95
+ "shortDescription" : "",
96
+ "shape" : "[1]",
97
+ "name" : "position_ids",
98
+ "type" : "MultiArray"
99
+ },
100
+ {
101
+ "hasShapeFlexibility" : "0",
102
+ "isOptional" : "0",
103
+ "dataType" : "Float16",
104
+ "formattedType" : "MultiArray (Float16 1 × 1 × 1 × 2048)",
105
+ "shortDescription" : "",
106
+ "shape" : "[1, 1, 1, 2048]",
107
+ "name" : "causal_mask",
108
+ "type" : "MultiArray"
109
+ },
110
+ {
111
+ "hasShapeFlexibility" : "0",
112
+ "isOptional" : "0",
113
+ "dataType" : "Int32",
114
+ "formattedType" : "MultiArray (Int32 1)",
115
+ "shortDescription" : "",
116
+ "shape" : "[1]",
117
+ "name" : "current_pos",
118
+ "type" : "MultiArray"
119
+ }
120
+ ],
121
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
122
+ "storagePrecision" : "Mixed (Float16, Int32, Palettized (11 bits), Palettized (13 bits), Palettized (15 bits), Palettized (7 bits), UInt4)",
123
+ "stateSchema" : [
124
+
125
+ ],
126
+ "outputSchema" : [
127
+ {
128
+ "hasShapeFlexibility" : "0",
129
+ "isOptional" : "0",
130
+ "dataType" : "Float16",
131
+ "formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
132
+ "shortDescription" : "",
133
+ "shape" : "[1, 1, 3072]",
134
+ "name" : "output_hidden_states",
135
+ "type" : "MultiArray"
136
+ }
137
+ ],
138
+ "name" : "infer",
139
+ "mlProgramOperationTypeHistogram" : {
140
+ "Ios18.expandDims" : 69,
141
+ "Ios18.mul" : 194,
142
+ "Ios18.cos" : 1,
143
+ "Ios18.softmax" : 16,
144
+ "Ios18.matmul" : 33,
145
+ "Ios18.rsqrt" : 33,
146
+ "Identity" : 2,
147
+ "Ios16.reduceMean" : 33,
148
+ "Ios18.sin" : 1,
149
+ "Split" : 16,
150
+ "Select" : 1,
151
+ "Tile" : 32,
152
+ "Ios18.add" : 113,
153
+ "Ios16.fillLike" : 1,
154
+ "Ios18.sliceUpdate" : 32,
155
+ "Ios18.reshape" : 99,
156
+ "Ios18.constexprLutToDense" : 97,
157
+ "Ios18.conv" : 96,
158
+ "Ios18.concat" : 65,
159
+ "Ios18.cast" : 1,
160
+ "Ios18.transpose" : 18,
161
+ "Ios18.pow" : 33,
162
+ "Ios18.silu" : 16,
163
+ "Ios18.lessEqual" : 1,
164
+ "Ios18.sliceByIndex" : 160,
165
+ "Ios18.squeeze" : 16
166
+ }
167
+ },
168
+ {
169
+ "inputSchema" : [
170
+ {
171
+ "hasShapeFlexibility" : "0",
172
+ "isOptional" : "0",
173
+ "dataType" : "Float16",
174
+ "formattedType" : "MultiArray (Float16 1 × 64 × 3072)",
175
+ "shortDescription" : "",
176
+ "shape" : "[1, 64, 3072]",
177
+ "name" : "hidden_states",
178
+ "type" : "MultiArray"
179
+ },
180
+ {
181
+ "hasShapeFlexibility" : "0",
182
+ "isOptional" : "0",
183
+ "dataType" : "Int32",
184
+ "formattedType" : "MultiArray (Int32 64)",
185
+ "shortDescription" : "",
186
+ "shape" : "[64]",
187
+ "name" : "position_ids",
188
+ "type" : "MultiArray"
189
+ },
190
+ {
191
+ "hasShapeFlexibility" : "0",
192
+ "isOptional" : "0",
193
+ "dataType" : "Float16",
194
+ "formattedType" : "MultiArray (Float16 1 × 1 × 64 × 2048)",
195
+ "shortDescription" : "",
196
+ "shape" : "[1, 1, 64, 2048]",
197
+ "name" : "causal_mask",
198
+ "type" : "MultiArray"
199
+ },
200
+ {
201
+ "hasShapeFlexibility" : "0",
202
+ "isOptional" : "0",
203
+ "dataType" : "Int32",
204
+ "formattedType" : "MultiArray (Int32 1)",
205
+ "shortDescription" : "",
206
+ "shape" : "[1]",
207
+ "name" : "current_pos",
208
+ "type" : "MultiArray"
209
+ }
210
+ ],
211
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
212
+ "storagePrecision" : "Mixed (Float16, Palettized (11 bits), Palettized (13 bits), Palettized (15 bits), Palettized (7 bits), UInt4)",
213
+ "stateSchema" : [
214
+
215
+ ],
216
+ "outputSchema" : [
217
+ {
218
+ "hasShapeFlexibility" : "0",
219
+ "isOptional" : "0",
220
+ "dataType" : "Float16",
221
+ "formattedType" : "MultiArray (Float16 1 × 64 × 3072)",
222
+ "shortDescription" : "",
223
+ "shape" : "[1, 64, 3072]",
224
+ "name" : "output_hidden_states",
225
+ "type" : "MultiArray"
226
+ }
227
+ ],
228
+ "name" : "prefill",
229
+ "mlProgramOperationTypeHistogram" : {
230
+ "Ios18.expandDims" : 67,
231
+ "Ios18.softmax" : 16,
232
+ "Ios18.cos" : 1,
233
+ "Ios18.mul" : 192,
234
+ "Ios18.matmul" : 33,
235
+ "Ios18.rsqrt" : 32,
236
+ "Identity" : 2,
237
+ "Ios16.reduceMean" : 32,
238
+ "Ios18.sin" : 1,
239
+ "Split" : 16,
240
+ "Tile" : 32,
241
+ "Ios18.add" : 112,
242
+ "Ios18.sliceUpdate" : 32,
243
+ "Ios18.reshape" : 98,
244
+ "Ios18.constexprLutToDense" : 97,
245
+ "Ios18.conv" : 96,
246
+ "Ios18.concat" : 65,
247
+ "Ios18.cast" : 1,
248
+ "Ios18.transpose" : 80,
249
+ "Ios18.pow" : 32,
250
+ "Ios18.silu" : 16,
251
+ "Ios18.sliceByIndex" : 160,
252
+ "Ios18.squeeze" : 16
253
+ }
254
+ }
255
+ ],
256
+ "version" : "0.3.4",
257
+ "isUpdatable" : "0",
258
+ "defaultFunctionName" : "infer",
259
+ "specificationVersion" : 9,
260
+ "stateSchema" : [
261
+
262
+ ],
263
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
264
+ "mlProgramOperationTypeHistogram" : {
265
+ "Ios18.expandDims" : 69,
266
+ "Ios18.mul" : 194,
267
+ "Ios18.cos" : 1,
268
+ "Ios18.softmax" : 16,
269
+ "Ios18.matmul" : 33,
270
+ "Ios18.rsqrt" : 33,
271
+ "Identity" : 2,
272
+ "Ios16.reduceMean" : 33,
273
+ "Ios18.sin" : 1,
274
+ "Split" : 16,
275
+ "Select" : 1,
276
+ "Tile" : 32,
277
+ "Ios18.add" : 113,
278
+ "Ios16.fillLike" : 1,
279
+ "Ios18.sliceUpdate" : 32,
280
+ "Ios18.reshape" : 99,
281
+ "Ios18.constexprLutToDense" : 97,
282
+ "Ios18.conv" : 96,
283
+ "Ios18.concat" : 65,
284
+ "Ios18.cast" : 1,
285
+ "Ios18.transpose" : 18,
286
+ "Ios18.pow" : 33,
287
+ "Ios18.silu" : 16,
288
+ "Ios18.lessEqual" : 1,
289
+ "Ios18.sliceByIndex" : 160,
290
+ "Ios18.squeeze" : 16
291
+ },
292
+ "shortDescription" : "Anemll Model: Multifunction Combined",
293
+ "generatedClassName" : "phi4_FFN_PF_lut4_chunk_02of02",
294
+ "author" : "Converted with Anemll v0.3.4",
295
+ "modelType" : {
296
+ "name" : "MLModelType_mlProgram"
297
+ }
298
+ }
299
+ ]
phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7cddf51a23eccf8537aff0f49164d219a60b12dcfabab1a51b297eed9104d0d
3
+ size 942252864
phi4_FFN_PF_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0deac5f27f9d44bdea9ad7c01884078b050749a8a146535c70762679ac9f04de
3
+ size 947140
phi4_FFN_PF_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7cddf51a23eccf8537aff0f49164d219a60b12dcfabab1a51b297eed9104d0d
3
+ size 942252864
phi4_FFN_PF_lut4_chunk_02of02.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "30CD2E36-07C5-46C1-A067-C7AF3DF75B14": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Specification",
7
+ "name": "model.mlmodel",
8
+ "path": "com.apple.CoreML/model.mlmodel"
9
+ },
10
+ "4B6D69A1-DA28-4E09-B239-28E2E3CAD832": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Weights",
13
+ "name": "weights",
14
+ "path": "com.apple.CoreML/weights"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "30CD2E36-07C5-46C1-A067-C7AF3DF75B14"
18
+ }
phi4_FFN_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:586eb631c94781bc7fb29b0dba9f94aed96c38cc9886abc87e283e62fb597837
3
+ size 465885
phi4_FFN_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ce2dab2f6ca3968850368574439596cbc90af797aa8b887ad7bf556c3975c27
3
+ size 941536064
phi4_FFN_lut4_chunk_01of02.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "10C45FAA-C192-4B04-A068-94CC88D24529": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Specification",
7
+ "name": "model.mlmodel",
8
+ "path": "com.apple.CoreML/model.mlmodel"
9
+ },
10
+ "CD944379-EDFB-49EF-BF36-AD1F74C8E637": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Weights",
13
+ "name": "weights",
14
+ "path": "com.apple.CoreML/weights"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "10C45FAA-C192-4B04-A068-94CC88D24529"
18
+ }
phi4_FFN_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01da65b3bc03491a84d0f48d5de5ad0355492b8d176244ce4fcf65f5b128ebe4
3
+ size 466038
phi4_FFN_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4b93c86e74522162838912ec96960a71fb56953b9a9cc173fe9d2f02b93938e
3
+ size 941536064
phi4_FFN_lut4_chunk_02of02.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "07A9AE1F-BD5F-43F9-9786-BF4AD9AA7067": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Specification",
7
+ "name": "model.mlmodel",
8
+ "path": "com.apple.CoreML/model.mlmodel"
9
+ },
10
+ "9335DBFF-822F-4875-917B-186684CE3051": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Weights",
13
+ "name": "weights",
14
+ "path": "com.apple.CoreML/weights"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "07A9AE1F-BD5F-43F9-9786-BF4AD9AA7067"
18
+ }
phi4_embeddings_lut8.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3c9e2c0ee2c9a3a599d109ae298f4474e53fba48d154a57b4a84513f70c6f0a
3
+ size 243
phi4_embeddings_lut8.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc923709421bf358759efcb64df7f19bf8e30bcfbf8aa0dc878c7fa229cf4b6c
3
+ size 383
phi4_embeddings_lut8.mlmodelc/metadata.json ADDED
@@ -0,0 +1,65 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "metadataOutputVersion" : "3.0",
4
+ "storagePrecision" : "Mixed (Float16, Palettized (23 bits), UInt8)",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float16",
10
+ "formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
11
+ "shortDescription" : "",
12
+ "shape" : "[1, 1, 3072]",
13
+ "name" : "hidden_states",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "modelParameters" : [
18
+
19
+ ],
20
+ "specificationVersion" : 9,
21
+ "mlProgramOperationTypeHistogram" : {
22
+ "Ios18.greaterEqual" : 2,
23
+ "Ios18.constexprLutToDense" : 1,
24
+ "Ios18.add" : 2,
25
+ "Select" : 2,
26
+ "Ios18.gather" : 1
27
+ },
28
+ "computePrecision" : "Mixed (Float16, Int32)",
29
+ "isUpdatable" : "0",
30
+ "stateSchema" : [
31
+
32
+ ],
33
+ "availability" : {
34
+ "macOS" : "15.0",
35
+ "tvOS" : "18.0",
36
+ "visionOS" : "2.0",
37
+ "watchOS" : "11.0",
38
+ "iOS" : "18.0",
39
+ "macCatalyst" : "18.0"
40
+ },
41
+ "modelType" : {
42
+ "name" : "MLModelType_mlProgram"
43
+ },
44
+ "userDefinedMetadata" : {
45
+ "com.github.apple.coremltools.conversion_date" : "2025-09-28",
46
+ "com.github.apple.coremltools.source" : "torch==2.8.0",
47
+ "com.github.apple.coremltools.version" : "9.0b1",
48
+ "com.github.apple.coremltools.source_dialect" : "TorchScript"
49
+ },
50
+ "inputSchema" : [
51
+ {
52
+ "hasShapeFlexibility" : "0",
53
+ "isOptional" : "0",
54
+ "dataType" : "Int32",
55
+ "formattedType" : "MultiArray (Int32 1 × 1)",
56
+ "shortDescription" : "",
57
+ "shape" : "[1, 1]",
58
+ "name" : "input_ids",
59
+ "type" : "MultiArray"
60
+ }
61
+ ],
62
+ "generatedClassName" : "phi4_embeddings_lut8",
63
+ "method" : "predict"
64
+ }
65
+ ]
phi4_embeddings_lut8.mlmodelc/model.mil ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ program(1.3)
2
+ [buildInfo = dict<string, string>({{"coremlc-component-MIL", "3500.14.1"}, {"coremlc-version", "3500.32.1"}})]
3
+ {
4
+ func main<ios18>(tensor<int32, [1, 1]> input_ids) {
5
+ int32 var_6_batch_dims_0 = const()[name = string("op_6_batch_dims_0"), val = int32(0)];
6
+ bool var_6_validate_indices_0 = const()[name = string("op_6_validate_indices_0"), val = bool(false)];
7
+ tensor<fp16, [200064, 3072]> embed_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor<uint8, [200064, 3072]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64))), lut = tensor<fp16, [25008, 1, 256, 1]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(614596736))))[name = string("embed_weight_to_fp16_palettized")];
8
+ int32 greater_equal_0_y_0 = const()[name = string("greater_equal_0_y_0"), val = int32(0)];
9
+ tensor<bool, [1, 1]> greater_equal_0 = greater_equal(x = input_ids, y = greater_equal_0_y_0)[name = string("greater_equal_0")];
10
+ int32 slice_by_index_0 = const()[name = string("slice_by_index_0"), val = int32(200064)];
11
+ tensor<int32, [1, 1]> add_0 = add(x = input_ids, y = slice_by_index_0)[name = string("add_0")];
12
+ tensor<int32, [1, 1]> select_0 = select(a = input_ids, b = add_0, cond = greater_equal_0)[name = string("select_0")];
13
+ int32 greater_equal_0_y_0_1 = const()[name = string("greater_equal_0_y_0_1"), val = int32(0)];
14
+ tensor<bool, [1, 1]> greater_equal_0_1 = greater_equal(x = select_0, y = greater_equal_0_y_0_1)[name = string("greater_equal_0_1")];
15
+ int32 slice_by_index_0_1 = const()[name = string("slice_by_index_0_1"), val = int32(200064)];
16
+ tensor<int32, [1, 1]> add_0_1 = add(x = select_0, y = slice_by_index_0_1)[name = string("add_0_1")];
17
+ tensor<int32, [1, 1]> select_0_1 = select(a = select_0, b = add_0_1, cond = greater_equal_0_1)[name = string("select_0_1")];
18
+ int32 op_6_cast_fp16_axis_0 = const()[name = string("op_6_cast_fp16_axis_0"), val = int32(0)];
19
+ tensor<fp16, [1, 1, 3072]> hidden_states = gather(axis = op_6_cast_fp16_axis_0, batch_dims = var_6_batch_dims_0, indices = select_0_1, validate_indices = var_6_validate_indices_0, x = embed_weight_to_fp16_palettized)[name = string("op_6_cast_fp16")];
20
+ } -> (hidden_states);
21
+ }
phi4_embeddings_lut8.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:471ccac8a8d66e8f8a024ce8b98f037dd31fa3bac450fdb53f1c8e3308ee011a
3
+ size 627400896
phi4_embeddings_lut8.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92af5fae585670c8e37cafbf73971a02bd75b8c102ec6ab9af0aaa723aa672b0
3
+ size 2526
phi4_embeddings_lut8.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:471ccac8a8d66e8f8a024ce8b98f037dd31fa3bac450fdb53f1c8e3308ee011a
3
+ size 627400896
phi4_embeddings_lut8.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "61B24E7A-D867-4391-A38F-50F28BF7D5FD": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Specification",
7
+ "name": "model.mlmodel",
8
+ "path": "com.apple.CoreML/model.mlmodel"
9
+ },
10
+ "7BCAECDE-96CA-47ED-ABB9-3F6559A9D4F4": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Weights",
13
+ "name": "weights",
14
+ "path": "com.apple.CoreML/weights"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "61B24E7A-D867-4391-A38F-50F28BF7D5FD"
18
+ }
phi4_lm_head_lut6.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d17ebd64d18ae52309635d5106ef6270ad518ededa11856b6c50bdc201c68e2
3
+ size 243
phi4_lm_head_lut6.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22a2a16ffd4f1e687322b91095caa994c6a27c2b1616dc92ec3f3f5a429895c1
3
+ size 383
phi4_lm_head_lut6.mlmodelc/metadata.json ADDED
@@ -0,0 +1,63 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "metadataOutputVersion" : "3.0",
4
+ "storagePrecision" : "Mixed (Float16, Palettized (21 bits), UInt6)",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float16",
10
+ "formattedType" : "MultiArray (Float16 1 × 1 × 200064)",
11
+ "shortDescription" : "",
12
+ "shape" : "[1, 1, 200064]",
13
+ "name" : "logits",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "modelParameters" : [
18
+
19
+ ],
20
+ "specificationVersion" : 9,
21
+ "mlProgramOperationTypeHistogram" : {
22
+ "Ios18.constexprLutToDense" : 1,
23
+ "Ios18.transpose" : 2,
24
+ "Ios18.conv" : 1
25
+ },
26
+ "computePrecision" : "Mixed (Float16, Int32)",
27
+ "isUpdatable" : "0",
28
+ "stateSchema" : [
29
+
30
+ ],
31
+ "availability" : {
32
+ "macOS" : "15.0",
33
+ "tvOS" : "18.0",
34
+ "visionOS" : "2.0",
35
+ "watchOS" : "11.0",
36
+ "iOS" : "18.0",
37
+ "macCatalyst" : "18.0"
38
+ },
39
+ "modelType" : {
40
+ "name" : "MLModelType_mlProgram"
41
+ },
42
+ "userDefinedMetadata" : {
43
+ "com.github.apple.coremltools.conversion_date" : "2025-09-28",
44
+ "com.github.apple.coremltools.source" : "torch==2.8.0",
45
+ "com.github.apple.coremltools.version" : "9.0b1",
46
+ "com.github.apple.coremltools.source_dialect" : "TorchScript"
47
+ },
48
+ "inputSchema" : [
49
+ {
50
+ "hasShapeFlexibility" : "0",
51
+ "isOptional" : "0",
52
+ "dataType" : "Float16",
53
+ "formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
54
+ "shortDescription" : "",
55
+ "shape" : "[1, 1, 3072]",
56
+ "name" : "hidden_states",
57
+ "type" : "MultiArray"
58
+ }
59
+ ],
60
+ "generatedClassName" : "phi4_lm_head_lut6",
61
+ "method" : "predict"
62
+ }
63
+ ]
phi4_lm_head_lut6.mlmodelc/model.mil ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ program(1.3)
2
+ [buildInfo = dict<string, string>({{"coremlc-component-MIL", "3500.14.1"}, {"coremlc-version", "3500.32.1"}})]
3
+ {
4
+ func main<ios18>(tensor<fp16, [1, 1, 3072]> hidden_states) {
5
+ tensor<int32, [3]> var_6 = const()[name = string("op_6"), val = tensor<int32, [3]>([0, 2, 1])];
6
+ string var_22_pad_type_0 = const()[name = string("op_22_pad_type_0"), val = string("valid")];
7
+ int32 var_22_groups_0 = const()[name = string("op_22_groups_0"), val = int32(1)];
8
+ tensor<int32, [1]> var_22_strides_0 = const()[name = string("op_22_strides_0"), val = tensor<int32, [1]>([1])];
9
+ tensor<int32, [2]> var_22_pad_0 = const()[name = string("op_22_pad_0"), val = tensor<int32, [2]>([0, 0])];
10
+ tensor<int32, [1]> var_22_dilations_0 = const()[name = string("op_22_dilations_0"), val = tensor<int32, [1]>([1])];
11
+ tensor<fp16, [200064, 3072, 1]> squeeze_0_cast_fp16_to_fp32_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor<uint6, [200064, 3072, 1]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64))), lut = tensor<fp16, [25008, 1, 1, 64, 1]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(460947584))))[name = string("squeeze_0_cast_fp16_to_fp32_to_fp16_palettized")];
12
+ tensor<fp16, [1, 3072, 1]> var_7_cast_fp16 = transpose(perm = var_6, x = hidden_states)[name = string("transpose_1")];
13
+ tensor<fp16, [1, 200064, 1]> var_22_cast_fp16 = conv(dilations = var_22_dilations_0, groups = var_22_groups_0, pad = var_22_pad_0, pad_type = var_22_pad_type_0, strides = var_22_strides_0, weight = squeeze_0_cast_fp16_to_fp32_to_fp16_palettized, x = var_7_cast_fp16)[name = string("op_22_cast_fp16")];
14
+ tensor<int32, [3]> var_26 = const()[name = string("op_26"), val = tensor<int32, [3]>([0, 2, 1])];
15
+ tensor<fp16, [1, 1, 200064]> logits = transpose(perm = var_26, x = var_22_cast_fp16)[name = string("transpose_0")];
16
+ } -> (logits);
17
+ }
phi4_lm_head_lut6.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1620b615ef8cd96a1087ca6fba635eebcc22398c4174ad45ef18dde785d365a
3
+ size 464148672
phi4_lm_head_lut6.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e7803878a76f9ada016ee6d8016448971188293a7ae6694eedc1d4ef86fb583
3
+ size 2080
phi4_lm_head_lut6.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1620b615ef8cd96a1087ca6fba635eebcc22398c4174ad45ef18dde785d365a
3
+ size 464148672
phi4_lm_head_lut6.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "3528B6F8-359A-47AB-9099-3E9C4121A65A": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Weights",
7
+ "name": "weights",
8
+ "path": "com.apple.CoreML/weights"
9
+ },
10
+ "5C3068C5-09B3-469D-9E30-D89DCD3242BA": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Specification",
13
+ "name": "model.mlmodel",
14
+ "path": "com.apple.CoreML/model.mlmodel"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "5C3068C5-09B3-469D-9E30-D89DCD3242BA"
18
+ }
phi4_prefill_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c7dffe2693f54d774fd943549a8029ebf7997991bb633be036c3761b5e97f3f
3
+ size 481032
phi4_prefill_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea0e5d1ec01f7d0a8c55c98384c211456ab42d35799ed274e3787bb86cf1d1b8
3
+ size 942029504
phi4_prefill_lut4_chunk_01of02.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "CF8A09C1-D506-45BD-80A3-4E36C2529334": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Weights",
7
+ "name": "weights",
8
+ "path": "com.apple.CoreML/weights"
9
+ },
10
+ "DA5F8CFD-5833-43DD-A9BD-0981D832D125": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Specification",
13
+ "name": "model.mlmodel",
14
+ "path": "com.apple.CoreML/model.mlmodel"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "DA5F8CFD-5833-43DD-A9BD-0981D832D125"
18
+ }
phi4_prefill_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/model.mlmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e0b8e9e132180bed768bc88e6aaa4a2056a0a6506815caf8d1090b1e6becd1f
3
+ size 481242
phi4_prefill_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7344a9ff4bcc5c1e124c7e110973d957cd6ddeafc603e9701b684076678969d4
3
+ size 942029504
phi4_prefill_lut4_chunk_02of02.mlpackage/Manifest.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fileFormatVersion": "1.0.0",
3
+ "itemInfoEntries": {
4
+ "05D6FC91-3A2E-4B17-975D-AF311B32C225": {
5
+ "author": "com.apple.CoreML",
6
+ "description": "CoreML Model Specification",
7
+ "name": "model.mlmodel",
8
+ "path": "com.apple.CoreML/model.mlmodel"
9
+ },
10
+ "A203C972-22D7-4829-B187-257027B2E637": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Weights",
13
+ "name": "weights",
14
+ "path": "com.apple.CoreML/weights"
15
+ }
16
+ },
17
+ "rootModelIdentifier": "05D6FC91-3A2E-4B17-975D-AF311B32C225"
18
+ }
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:382cc235b56c725945e149cc25f191da667c836655efd0857b004320e90e91ea
3
+ size 15524095